ccid3.c 35.9 KB
Newer Older
1 2 3 4
/*
 *  net/dccp/ccids/ccid3.c
 *
 *  Copyright (c) 2005 The University of Waikato, Hamilton, New Zealand.
5
 *  Copyright (c) 2005-6 Ian McDonald <ian.mcdonald@jandi.co.nz>
6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38
 *
 *  An implementation of the DCCP protocol
 *
 *  This code has been developed by the University of Waikato WAND
 *  research group. For further information please see http://www.wand.net.nz/
 *
 *  This code also uses code from Lulea University, rereleased as GPL by its
 *  authors:
 *  Copyright (c) 2003 Nils-Erik Mattsson, Joacim Haggmark, Magnus Erixzon
 *
 *  Changes to meet Linux coding standards, to make it meet latest ccid3 draft
 *  and to make it work as a loadable module in the DCCP stack written by
 *  Arnaldo Carvalho de Melo <acme@conectiva.com.br>.
 *
 *  Copyright (c) 2005 Arnaldo Carvalho de Melo <acme@conectiva.com.br>
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, write to the Free Software
 *  Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

#include "../ccid.h"
#include "../dccp.h"
39
#include "lib/packet_history.h"
40
#include "lib/loss_interval.h"
41
#include "lib/tfrc.h"
42 43
#include "ccid3.h"

44
/*
45 46
 * Reason for maths here is to avoid 32 bit overflow when a is big.
 * With this we get close to the limit.
47
 */
48
static u32 usecs_div(const u32 a, const u32 b)
49
{
50 51 52 53 54 55 56 57 58 59 60
	const u32 div = a < (UINT_MAX / (USEC_PER_SEC /    10)) ?    10 :
			a < (UINT_MAX / (USEC_PER_SEC /    50)) ?    50 :
			a < (UINT_MAX / (USEC_PER_SEC /   100)) ?   100 :
			a < (UINT_MAX / (USEC_PER_SEC /   500)) ?   500 :
			a < (UINT_MAX / (USEC_PER_SEC /  1000)) ?  1000 :
			a < (UINT_MAX / (USEC_PER_SEC /  5000)) ?  5000 :
			a < (UINT_MAX / (USEC_PER_SEC / 10000)) ? 10000 :
			a < (UINT_MAX / (USEC_PER_SEC / 50000)) ? 50000 :
								 100000;
	const u32 tmp = a * (USEC_PER_SEC / div);
	return (b >= 2 * div) ? tmp / (b / div) : tmp;
61 62
}

63

64 65 66 67

#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
static int ccid3_debug;
#define ccid3_pr_debug(format, a...)	DCCP_PR_DEBUG(ccid3_debug, format, ##a)
68 69 70 71
#else
#define ccid3_pr_debug(format, a...)
#endif

72 73
static struct dccp_tx_hist *ccid3_tx_hist;
static struct dccp_rx_hist *ccid3_rx_hist;
74
static struct dccp_li_hist *ccid3_li_hist;
75

76
#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
77 78 79 80 81 82 83 84 85 86 87 88 89
static const char *ccid3_tx_state_name(enum ccid3_hc_tx_states state)
{
	static char *ccid3_state_names[] = {
	[TFRC_SSTATE_NO_SENT]  = "NO_SENT",
	[TFRC_SSTATE_NO_FBACK] = "NO_FBACK",
	[TFRC_SSTATE_FBACK]    = "FBACK",
	[TFRC_SSTATE_TERM]     = "TERM",
	};

	return ccid3_state_names[state];
}
#endif

90 91
static void ccid3_hc_tx_set_state(struct sock *sk,
				  enum ccid3_hc_tx_states state)
92
{
93
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
94 95 96
	enum ccid3_hc_tx_states oldstate = hctx->ccid3hctx_state;

	ccid3_pr_debug("%s(%p) %-8.8s -> %s\n",
97 98
		       dccp_role(sk), sk, ccid3_tx_state_name(oldstate),
		       ccid3_tx_state_name(state));
99 100 101 102 103 104 105
	WARN_ON(state == oldstate);
	hctx->ccid3hctx_state = state;
}

/* Calculate new t_ipi (inter packet interval) by t_ipi = s / X_inst */
static inline void ccid3_calc_new_t_ipi(struct ccid3_hc_tx_sock *hctx)
{
106
	hctx->ccid3hctx_t_ipi = usecs_div(hctx->ccid3hctx_s, hctx->ccid3hctx_x);
107 108 109 110 111
}

/* Calculate new delta by delta = min(t_ipi / 2, t_gran / 2) */
static inline void ccid3_calc_new_delta(struct ccid3_hc_tx_sock *hctx)
{
112 113
	hctx->ccid3hctx_delta = min_t(u32, hctx->ccid3hctx_t_ipi / 2,
					   TFRC_OPSYS_HALF_TIME_GRAN);
114 115 116 117 118 119 120 121 122 123 124 125 126 127
}

/*
 * Update X by
 *    If (p > 0)
 *       x_calc = calcX(s, R, p);
 *       X = max(min(X_calc, 2 * X_recv), s / t_mbi);
 *    Else
 *       If (now - tld >= R)
 *          X = max(min(2 * X, 2 * X_recv), s / R);
 *          tld = now;
 */ 
static void ccid3_hc_tx_update_x(struct sock *sk)
{
128
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
129

130 131
	/* To avoid large error in calcX */
	if (hctx->ccid3hctx_p >= TFRC_SMALLEST_P) {
132 133 134
		hctx->ccid3hctx_x_calc = tfrc_calc_x(hctx->ccid3hctx_s,
						     hctx->ccid3hctx_rtt,
						     hctx->ccid3hctx_p);
135 136 137 138
		hctx->ccid3hctx_x = max_t(u32, min_t(u32, hctx->ccid3hctx_x_calc,
							  2 * hctx->ccid3hctx_x_recv),
					       (hctx->ccid3hctx_s /
					        TFRC_MAX_BACK_OFF_TIME));
139 140 141
	} else {
		struct timeval now;

142
		dccp_timestamp(sk, &now);
143 144
	       	if (timeval_delta(&now, &hctx->ccid3hctx_t_ld) >=
		    hctx->ccid3hctx_rtt) {
145 146 147 148
			hctx->ccid3hctx_x = max_t(u32, min_t(u32, hctx->ccid3hctx_x_recv,
								  hctx->ccid3hctx_x) * 2,
						       usecs_div(hctx->ccid3hctx_s,
							       	 hctx->ccid3hctx_rtt));
149 150
			hctx->ccid3hctx_t_ld = now;
		}
151 152 153 154 155 156 157
	}
}

static void ccid3_hc_tx_no_feedback_timer(unsigned long data)
{
	struct sock *sk = (struct sock *)data;
	unsigned long next_tmout = 0;
158
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
159 160 161 162 163

	bh_lock_sock(sk);
	if (sock_owned_by_user(sk)) {
		/* Try again later. */
		/* XXX: set some sensible MIB */
164 165
		sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer,
			       jiffies + HZ / 5);
166 167 168 169 170 171 172 173 174 175
		goto out;
	}

	ccid3_pr_debug("%s, sk=%p, state=%s\n", dccp_role(sk), sk,
		       ccid3_tx_state_name(hctx->ccid3hctx_state));
	
	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_FBACK:
		/* Halve send rate */
		hctx->ccid3hctx_x /= 2;
176 177
		if (hctx->ccid3hctx_x < (hctx->ccid3hctx_s /
					 TFRC_MAX_BACK_OFF_TIME))
178 179
			hctx->ccid3hctx_x = (hctx->ccid3hctx_s /
					     TFRC_MAX_BACK_OFF_TIME);
180

181 182 183 184
		ccid3_pr_debug("%s, sk=%p, state=%s, updated tx rate to %d "
			       "bytes/s\n",
			       dccp_role(sk), sk,
			       ccid3_tx_state_name(hctx->ccid3hctx_state),
185
			       hctx->ccid3hctx_x);
186 187
		next_tmout = max_t(u32, 2 * usecs_div(hctx->ccid3hctx_s,
						      hctx->ccid3hctx_x),
188 189 190 191 192 193
					TFRC_INITIAL_TIMEOUT);
		/*
		 * FIXME - not sure above calculation is correct. See section
		 * 5 of CCID3 11 should adjust tx_t_ipi and double that to
		 * achieve it really
		 */
194 195
		break;
	case TFRC_SSTATE_FBACK:
196 197 198 199 200
		/*
		 * Check if IDLE since last timeout and recv rate is less than
		 * 4 packets per RTT
		 */
		if (!hctx->ccid3hctx_idle ||
201 202
		    (hctx->ccid3hctx_x_recv >=
		     4 * usecs_div(hctx->ccid3hctx_s, hctx->ccid3hctx_rtt))) {
203 204
			ccid3_pr_debug("%s, sk=%p, state=%s, not idle\n",
				       dccp_role(sk), sk,
205 206 207 208 209 210 211 212
				       ccid3_tx_state_name(hctx->ccid3hctx_state));
			/* Halve sending rate */

			/*  If (X_calc > 2 * X_recv)
			 *    X_recv = max(X_recv / 2, s / (2 * t_mbi));
			 *  Else
			 *    X_recv = X_calc / 4;
			 */
213 214
			BUG_ON(hctx->ccid3hctx_p >= TFRC_SMALLEST_P &&
			       hctx->ccid3hctx_x_calc == 0);
215 216 217 218 219 220 221 222 223 224 225 226

			/* check also if p is zero -> x_calc is infinity? */
			if (hctx->ccid3hctx_p < TFRC_SMALLEST_P ||
			    hctx->ccid3hctx_x_calc > 2 * hctx->ccid3hctx_x_recv)
				hctx->ccid3hctx_x_recv = max_t(u32, hctx->ccid3hctx_x_recv / 2,
								    hctx->ccid3hctx_s / (2 * TFRC_MAX_BACK_OFF_TIME));
			else
				hctx->ccid3hctx_x_recv = hctx->ccid3hctx_x_calc / 4;

			/* Update sending rate */
			ccid3_hc_tx_update_x(sk);
		}
227 228 229 230
		/*
		 * Schedule no feedback timer to expire in
		 * max(4 * R, 2 * s / X)
		 */
231
		next_tmout = max_t(u32, hctx->ccid3hctx_t_rto, 
232 233
					2 * usecs_div(hctx->ccid3hctx_s,
						      hctx->ccid3hctx_x));
234
		break;
235 236 237 238
	case TFRC_SSTATE_NO_SENT:
		DCCP_BUG("Illegal %s state NO_SENT, sk=%p", dccp_role(sk), sk);
		/* fall through */
	case TFRC_SSTATE_TERM:
239 240 241 242
		goto out;
	}

	sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer, 
243
		      jiffies + max_t(u32, 1, usecs_to_jiffies(next_tmout)));
244 245 246 247 248 249
	hctx->ccid3hctx_idle = 1;
out:
	bh_unlock_sock(sk);
	sock_put(sk);
}

250 251
static int ccid3_hc_tx_send_packet(struct sock *sk,
				   struct sk_buff *skb, int len)
252 253
{
	struct dccp_sock *dp = dccp_sk(sk);
254
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
255
	struct dccp_tx_hist_entry *new_packet;
256
	struct timeval now;
257
	long delay;
258 259
	int rc = -ENOTCONN;

260
	BUG_ON(hctx == NULL);
261

262
	/* Check if pure ACK or Terminating*/
263
	/*
264 265
	 * XXX: We only call this function for DATA and DATAACK, on, these
	 * packets can have zero length, but why the comment about "pure ACK"?
266
	 */
267
	if (unlikely(len == 0))
268 269 270
		goto out;

	/* See if last packet allocated was not sent */
271 272
	new_packet = dccp_tx_hist_head(&hctx->ccid3hctx_hist);
	if (new_packet == NULL || new_packet->dccphtx_sent) {
273 274
		new_packet = dccp_tx_hist_entry_new(ccid3_tx_hist,
						    SLAB_ATOMIC);
275 276

		rc = -ENOBUFS;
277
		if (unlikely(new_packet == NULL)) {
278 279
			DCCP_WARN("%s, sk=%p, not enough mem to add to history,"
				  "send refused\n", dccp_role(sk), sk);
280 281 282
			goto out;
		}

283
		dccp_tx_hist_add_entry(&hctx->ccid3hctx_hist, new_packet);
284 285
	}

286
	dccp_timestamp(sk, &now);
287 288 289

	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_SENT:
290 291
		sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer,
			       jiffies + usecs_to_jiffies(TFRC_INITIAL_TIMEOUT));
292 293 294 295
		hctx->ccid3hctx_last_win_count	 = 0;
		hctx->ccid3hctx_t_last_win_count = now;
		ccid3_hc_tx_set_state(sk, TFRC_SSTATE_NO_FBACK);

296 297 298 299 300 301
		/* First timeout, according to [RFC 3448, 4.2], is 1 second */
		hctx->ccid3hctx_t_ipi = USEC_PER_SEC;
		/* Initial delta: minimum of 0.5 sec and t_gran/2 */
		hctx->ccid3hctx_delta = TFRC_OPSYS_HALF_TIME_GRAN;

		/* Set t_0 for initial packet */
302 303 304 305 306
		hctx->ccid3hctx_t_nom = now;
		rc = 0;
		break;
	case TFRC_SSTATE_NO_FBACK:
	case TFRC_SSTATE_FBACK:
307 308 309 310 311 312 313 314 315 316 317 318 319
		delay = timeval_delta(&hctx->ccid3hctx_t_nom, &now);
		/*
		 * 	Scheduling of packet transmissions [RFC 3448, 4.6]
		 *
		 * if (t_now > t_nom - delta)
		 *       // send the packet now
		 * else
		 *       // send the packet in (t_nom - t_now) milliseconds.
		 */
		if (delay < hctx->ccid3hctx_delta)
			rc = 0;
		else
			rc = delay/1000L;
320
		break;
321 322
	case TFRC_SSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
323 324 325 326 327
		rc = -EINVAL;
		break;
	}

	/* Can we send? if so add options and add to packet history */
328 329
	if (rc == 0) {
		dp->dccps_hc_tx_insert_options = 1;
330
		new_packet->dccphtx_ccval =
331 332
			DCCP_SKB_CB(skb)->dccpd_ccval =
				hctx->ccid3hctx_last_win_count;
I
Ian McDonald 已提交
333 334
		timeval_add_usecs(&hctx->ccid3hctx_t_nom,
				  hctx->ccid3hctx_t_ipi);
335
	}
336 337 338 339 340 341
out:
	return rc;
}

static void ccid3_hc_tx_packet_sent(struct sock *sk, int more, int len)
{
342 343
	const struct dccp_sock *dp = dccp_sk(sk);
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
344 345
	struct timeval now;

346
	BUG_ON(hctx == NULL);
347

348
	dccp_timestamp(sk, &now);
349 350 351 352

	/* check if we have sent a data packet */
	if (len > 0) {
		unsigned long quarter_rtt;
353
		struct dccp_tx_hist_entry *packet;
354

355
		packet = dccp_tx_hist_head(&hctx->ccid3hctx_hist);
356
		if (unlikely(packet == NULL)) {
357
			DCCP_WARN("packet doesn't exist in history!\n");
358 359
			return;
		}
360
		if (unlikely(packet->dccphtx_sent)) {
361
			DCCP_WARN("no unsent packet in history!\n");
362 363
			return;
		}
364 365
		packet->dccphtx_tstamp = now;
		packet->dccphtx_seqno  = dp->dccps_gss;
366
		/*
367
		 * Check if win_count have changed
368
		 * Algorithm in "8.1. Window Counter Value" in RFC 4342.
369
		 */
370 371 372 373
		quarter_rtt = timeval_delta(&now, &hctx->ccid3hctx_t_last_win_count);
		if (likely(hctx->ccid3hctx_rtt > 8))
			quarter_rtt /= hctx->ccid3hctx_rtt / 4;

374 375 376 377
		if (quarter_rtt > 0) {
			hctx->ccid3hctx_t_last_win_count = now;
			hctx->ccid3hctx_last_win_count	 = (hctx->ccid3hctx_last_win_count +
							    min_t(unsigned long, quarter_rtt, 5)) % 16;
378 379
			ccid3_pr_debug("%s, sk=%p, window changed from "
				       "%u to %u!\n",
380
				       dccp_role(sk), sk,
381
				       packet->dccphtx_ccval,
382 383
				       hctx->ccid3hctx_last_win_count);
		}
384

385
		hctx->ccid3hctx_idle = 0;
386
		packet->dccphtx_rtt  = hctx->ccid3hctx_rtt;
387
		packet->dccphtx_sent = 1;
388 389 390 391 392 393 394 395
	} else
		ccid3_pr_debug("%s, sk=%p, seqno=%llu NOT inserted!\n",
			       dccp_role(sk), sk, dp->dccps_gss);

	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_SENT:
		/* if first wasn't pure ack */
		if (len != 0)
396 397
			DCCP_CRIT("%s, First packet sent is noted "
				  "as a data packet",  dccp_role(sk));
398 399
		return;
	case TFRC_SSTATE_NO_FBACK:
400 401
		/* t_nom, t_ipi, delta do not change until feedback arrives */
		return;
402 403
	case TFRC_SSTATE_FBACK:
		if (len > 0) {
I
Ian McDonald 已提交
404 405
			timeval_sub_usecs(&hctx->ccid3hctx_t_nom,
				  hctx->ccid3hctx_t_ipi);
406 407
			ccid3_calc_new_t_ipi(hctx);
			ccid3_calc_new_delta(hctx);
408 409
			timeval_add_usecs(&hctx->ccid3hctx_t_nom,
					  hctx->ccid3hctx_t_ipi);
410 411
		}
		break;
412 413
	case TFRC_SSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
414 415 416 417 418 419
		break;
	}
}

static void ccid3_hc_tx_packet_recv(struct sock *sk, struct sk_buff *skb)
{
420 421
	const struct dccp_sock *dp = dccp_sk(sk);
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
422
	struct ccid3_options_received *opt_recv;
423
	struct dccp_tx_hist_entry *packet;
424
	struct timeval now;
425
	unsigned long next_tmout; 
I
Ian McDonald 已提交
426
	u32 t_elapsed;
427 428 429
	u32 pinv;
	u32 x_recv;
	u32 r_sample;
430

431
	BUG_ON(hctx == NULL);
432 433 434 435 436 437 438 439

	/* we are only interested in ACKs */
	if (!(DCCP_SKB_CB(skb)->dccpd_type == DCCP_PKT_ACK ||
	      DCCP_SKB_CB(skb)->dccpd_type == DCCP_PKT_DATAACK))
		return;

	opt_recv = &hctx->ccid3hctx_options_received;

440
	t_elapsed = dp->dccps_options_received.dccpor_elapsed_time * 10;
441 442 443 444 445 446 447 448 449 450 451 452
	x_recv = opt_recv->ccid3or_receive_rate;
	pinv = opt_recv->ccid3or_loss_event_rate;

	switch (hctx->ccid3hctx_state) {
	case TFRC_SSTATE_NO_SENT:
		/* FIXME: what to do here? */
		return;
	case TFRC_SSTATE_NO_FBACK:
	case TFRC_SSTATE_FBACK:
		/* Calculate new round trip sample by
		 * R_sample = (now - t_recvdata) - t_delay */
		/* get t_recvdata from history */
453 454
		packet = dccp_tx_hist_find_entry(&hctx->ccid3hctx_hist,
						 DCCP_SKB_CB(skb)->dccpd_ack_seq);
455
		if (unlikely(packet == NULL)) {
456 457
			DCCP_WARN("%s, sk=%p, seqno %llu(%s) does't exist "
				  "in history!\n",  dccp_role(sk), sk,
458
			    (unsigned long long)DCCP_SKB_CB(skb)->dccpd_ack_seq,
459
				  dccp_packet_name(DCCP_SKB_CB(skb)->dccpd_type));
460 461 462 463
			return;
		}

		/* Update RTT */
464 465
		dccp_timestamp(sk, &now);
		r_sample = timeval_delta(&now, &packet->dccphtx_tstamp);
466
		if (unlikely(r_sample <= t_elapsed))
467 468
			DCCP_WARN("r_sample=%uus,t_elapsed=%uus\n",
				  r_sample, t_elapsed);
469 470
		else
			r_sample -= t_elapsed;
471 472 473 474 475 476 477 478 479 480 481 482 483

		/* Update RTT estimate by 
		 * If (No feedback recv)
		 *    R = R_sample;
		 * Else
		 *    R = q * R + (1 - q) * R_sample;
		 *
		 * q is a constant, RFC 3448 recomments 0.9
		 */
		if (hctx->ccid3hctx_state == TFRC_SSTATE_NO_FBACK) {
			ccid3_hc_tx_set_state(sk, TFRC_SSTATE_FBACK);
			hctx->ccid3hctx_rtt = r_sample;
		} else
484 485
			hctx->ccid3hctx_rtt = (hctx->ccid3hctx_rtt * 9) / 10 +
					      r_sample / 10;
486

487 488 489
		ccid3_pr_debug("%s, sk=%p, New RTT estimate=%uus, "
			       "r_sample=%us\n", dccp_role(sk), sk,
			       hctx->ccid3hctx_rtt, r_sample);
490 491

		/* Update timeout interval */
492 493
		hctx->ccid3hctx_t_rto = max_t(u32, 4 * hctx->ccid3hctx_rtt,
					      USEC_PER_SEC);
494 495

		/* Update receive rate */
496
		hctx->ccid3hctx_x_recv = x_recv;/* X_recv in bytes per sec */
497 498 499 500 501 502 503 504 505

		/* Update loss event rate */
		if (pinv == ~0 || pinv == 0)
			hctx->ccid3hctx_p = 0;
		else {
			hctx->ccid3hctx_p = 1000000 / pinv;

			if (hctx->ccid3hctx_p < TFRC_SMALLEST_P) {
				hctx->ccid3hctx_p = TFRC_SMALLEST_P;
506 507
				ccid3_pr_debug("%s, sk=%p, Smallest p used!\n",
					       dccp_role(sk), sk);
508 509 510 511 512 513 514 515 516 517
			}
		}

		/* unschedule no feedback timer */
		sk_stop_timer(sk, &hctx->ccid3hctx_no_feedback_timer);

		/* Update sending rate */
		ccid3_hc_tx_update_x(sk);

		/* Update next send time */
518 519
		timeval_sub_usecs(&hctx->ccid3hctx_t_nom,
				  hctx->ccid3hctx_t_ipi);
520
		ccid3_calc_new_t_ipi(hctx);
521 522
		timeval_add_usecs(&hctx->ccid3hctx_t_nom,
				  hctx->ccid3hctx_t_ipi);
523 524 525
		ccid3_calc_new_delta(hctx);

		/* remove all packets older than the one acked from history */
526 527
		dccp_tx_hist_purge_older(ccid3_tx_hist,
					 &hctx->ccid3hctx_hist, packet);
528 529 530 531 532
		/*
		 * As we have calculated new ipi, delta, t_nom it is possible that
		 * we now can send a packet, so wake up dccp_wait_for_ccids.
		 */
		sk->sk_write_space(sk);
533

534 535 536 537
		/*
		 * Schedule no feedback timer to expire in
		 * max(4 * R, 2 * s / X)
		 */
538
		next_tmout = max(hctx->ccid3hctx_t_rto,
539 540 541
				 2 * usecs_div(hctx->ccid3hctx_s,
					       hctx->ccid3hctx_x));
			
542 543 544 545
		ccid3_pr_debug("%s, sk=%p, Scheduled no feedback timer to "
			       "expire in %lu jiffies (%luus)\n",
			       dccp_role(sk), sk,
			       usecs_to_jiffies(next_tmout), next_tmout); 
546 547

		sk_reset_timer(sk, &hctx->ccid3hctx_no_feedback_timer, 
548
			       jiffies + max_t(u32, 1, usecs_to_jiffies(next_tmout)));
549 550 551 552

		/* set idle flag */
		hctx->ccid3hctx_idle = 1;   
		break;
553 554
	case TFRC_SSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
555 556 557 558
		break;
	}
}

559
static int ccid3_hc_tx_insert_options(struct sock *sk, struct sk_buff *skb)
560
{
561
	const struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
562

563 564
	BUG_ON(hctx == NULL);

565 566 567
	if (sk->sk_state == DCCP_OPEN || sk->sk_state == DCCP_PARTOPEN)
		DCCP_SKB_CB(skb)->dccpd_ccval = hctx->ccid3hctx_last_win_count;
	return 0;
568 569 570
}

static int ccid3_hc_tx_parse_options(struct sock *sk, unsigned char option,
571 572
				     unsigned char len, u16 idx,
				     unsigned char *value)
573 574
{
	int rc = 0;
575 576
	const struct dccp_sock *dp = dccp_sk(sk);
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
577 578
	struct ccid3_options_received *opt_recv;

579
	BUG_ON(hctx == NULL);
580 581 582 583 584 585 586 587 588 589 590 591 592

	opt_recv = &hctx->ccid3hctx_options_received;

	if (opt_recv->ccid3or_seqno != dp->dccps_gsr) {
		opt_recv->ccid3or_seqno		     = dp->dccps_gsr;
		opt_recv->ccid3or_loss_event_rate    = ~0;
		opt_recv->ccid3or_loss_intervals_idx = 0;
		opt_recv->ccid3or_loss_intervals_len = 0;
		opt_recv->ccid3or_receive_rate	     = 0;
	}

	switch (option) {
	case TFRC_OPT_LOSS_EVENT_RATE:
593
		if (unlikely(len != 4)) {
594 595 596
			DCCP_WARN("%s, sk=%p, invalid len %d "
				  "for TFRC_OPT_LOSS_EVENT_RATE\n",
				  dccp_role(sk), sk, len);
597 598
			rc = -EINVAL;
		} else {
599
			opt_recv->ccid3or_loss_event_rate = ntohl(*(__be32 *)value);
600 601 602 603 604 605 606 607 608 609 610 611 612 613
			ccid3_pr_debug("%s, sk=%p, LOSS_EVENT_RATE=%u\n",
				       dccp_role(sk), sk,
				       opt_recv->ccid3or_loss_event_rate);
		}
		break;
	case TFRC_OPT_LOSS_INTERVALS:
		opt_recv->ccid3or_loss_intervals_idx = idx;
		opt_recv->ccid3or_loss_intervals_len = len;
		ccid3_pr_debug("%s, sk=%p, LOSS_INTERVALS=(%u, %u)\n",
			       dccp_role(sk), sk,
			       opt_recv->ccid3or_loss_intervals_idx,
			       opt_recv->ccid3or_loss_intervals_len);
		break;
	case TFRC_OPT_RECEIVE_RATE:
614
		if (unlikely(len != 4)) {
615 616 617
			DCCP_WARN("%s, sk=%p, invalid len %d "
				  "for TFRC_OPT_RECEIVE_RATE\n",
				  dccp_role(sk), sk, len);
618 619
			rc = -EINVAL;
		} else {
620
			opt_recv->ccid3or_receive_rate = ntohl(*(__be32 *)value);
621 622 623 624 625 626 627 628 629 630
			ccid3_pr_debug("%s, sk=%p, RECEIVE_RATE=%u\n",
				       dccp_role(sk), sk,
				       opt_recv->ccid3or_receive_rate);
		}
		break;
	}

	return rc;
}

631
static int ccid3_hc_tx_init(struct ccid *ccid, struct sock *sk)
632 633
{
	struct dccp_sock *dp = dccp_sk(sk);
634
	struct ccid3_hc_tx_sock *hctx = ccid_priv(ccid);
635

636 637 638
	if (dp->dccps_packet_size >= TFRC_MIN_PACKET_SIZE &&
	    dp->dccps_packet_size <= TFRC_MAX_PACKET_SIZE)
		hctx->ccid3hctx_s = dp->dccps_packet_size;
639 640 641
	else
		hctx->ccid3hctx_s = TFRC_STD_PACKET_SIZE;

642 643
	/* Set transmission rate to 1 packet per second */
	hctx->ccid3hctx_x     = hctx->ccid3hctx_s;
644
	hctx->ccid3hctx_t_rto = USEC_PER_SEC;
645 646
	hctx->ccid3hctx_state = TFRC_SSTATE_NO_SENT;
	INIT_LIST_HEAD(&hctx->ccid3hctx_hist);
647 648 649

	hctx->ccid3hctx_no_feedback_timer.function = ccid3_hc_tx_no_feedback_timer;
	hctx->ccid3hctx_no_feedback_timer.data     = (unsigned long)sk;
650 651 652 653 654 655 656
	init_timer(&hctx->ccid3hctx_no_feedback_timer);

	return 0;
}

static void ccid3_hc_tx_exit(struct sock *sk)
{
657
	struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
658 659 660 661 662 663 664

	BUG_ON(hctx == NULL);

	ccid3_hc_tx_set_state(sk, TFRC_SSTATE_TERM);
	sk_stop_timer(sk, &hctx->ccid3hctx_no_feedback_timer);

	/* Empty packet history */
665
	dccp_tx_hist_purge(ccid3_tx_hist, &hctx->ccid3hctx_hist);
666 667 668 669 670 671
}

/*
 * RX Half Connection methods
 */

672
#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
673 674 675 676 677 678 679 680 681 682 683 684
static const char *ccid3_rx_state_name(enum ccid3_hc_rx_states state)
{
	static char *ccid3_rx_state_names[] = {
	[TFRC_RSTATE_NO_DATA] = "NO_DATA",
	[TFRC_RSTATE_DATA]    = "DATA",
	[TFRC_RSTATE_TERM]    = "TERM",
	};

	return ccid3_rx_state_names[state];
}
#endif

685 686
static void ccid3_hc_rx_set_state(struct sock *sk,
				  enum ccid3_hc_rx_states state)
687
{
688
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
689 690 691
	enum ccid3_hc_rx_states oldstate = hcrx->ccid3hcrx_state;

	ccid3_pr_debug("%s(%p) %-8.8s -> %s\n",
692 693
		       dccp_role(sk), sk, ccid3_rx_state_name(oldstate),
		       ccid3_rx_state_name(state));
694 695 696 697 698 699
	WARN_ON(state == oldstate);
	hcrx->ccid3hcrx_state = state;
}

static void ccid3_hc_rx_send_feedback(struct sock *sk)
{
700
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
701
	struct dccp_sock *dp = dccp_sk(sk);
702
	struct dccp_rx_hist_entry *packet;
703
	struct timeval now;
704 705 706

	ccid3_pr_debug("%s, sk=%p\n", dccp_role(sk), sk);

707
	dccp_timestamp(sk, &now);
708

709 710 711 712 713
	switch (hcrx->ccid3hcrx_state) {
	case TFRC_RSTATE_NO_DATA:
		hcrx->ccid3hcrx_x_recv = 0;
		break;
	case TFRC_RSTATE_DATA: {
714 715
		const u32 delta = timeval_delta(&now,
					&hcrx->ccid3hcrx_tstamp_last_feedback);
716 717
		hcrx->ccid3hcrx_x_recv = usecs_div(hcrx->ccid3hcrx_bytes_recv,
						   delta);
718 719
	}
		break;
720 721
	case TFRC_RSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
722 723 724
		return;
	}

725
	packet = dccp_rx_hist_find_data_packet(&hcrx->ccid3hcrx_hist);
726
	if (unlikely(packet == NULL)) {
727 728
		DCCP_WARN("%s, sk=%p, no data packet in history!\n",
			  dccp_role(sk), sk);
729 730 731
		return;
	}

732
	hcrx->ccid3hcrx_tstamp_last_feedback = now;
I
Ian McDonald 已提交
733
	hcrx->ccid3hcrx_ccval_last_counter   = packet->dccphrx_ccval;
734 735 736
	hcrx->ccid3hcrx_bytes_recv	     = 0;

	/* Convert to multiples of 10us */
737 738
	hcrx->ccid3hcrx_elapsed_time =
			timeval_delta(&now, &packet->dccphrx_tstamp) / 10;
739 740 741 742
	if (hcrx->ccid3hcrx_p == 0)
		hcrx->ccid3hcrx_pinv = ~0;
	else
		hcrx->ccid3hcrx_pinv = 1000000 / hcrx->ccid3hcrx_p;
743
	dp->dccps_hc_rx_insert_options = 1;
744 745 746
	dccp_send_ack(sk);
}

747
static int ccid3_hc_rx_insert_options(struct sock *sk, struct sk_buff *skb)
748
{
749
	const struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
750
	__be32 x_recv, pinv;
751

752 753 754
	BUG_ON(hcrx == NULL);

	if (!(sk->sk_state == DCCP_OPEN || sk->sk_state == DCCP_PARTOPEN))
755
		return 0;
756

I
Ian McDonald 已提交
757
	DCCP_SKB_CB(skb)->dccpd_ccval = hcrx->ccid3hcrx_ccval_last_counter;
758 759

	if (dccp_packet_without_ack(skb))
760 761
		return 0;

762 763
	x_recv = htonl(hcrx->ccid3hcrx_x_recv);
	pinv   = htonl(hcrx->ccid3hcrx_pinv);
764 765 766 767 768 769 770 771 772 773 774 775

	if ((hcrx->ccid3hcrx_elapsed_time != 0 &&
	     dccp_insert_option_elapsed_time(sk, skb,
					     hcrx->ccid3hcrx_elapsed_time)) ||
	    dccp_insert_option_timestamp(sk, skb) ||
	    dccp_insert_option(sk, skb, TFRC_OPT_LOSS_EVENT_RATE,
		    	       &pinv, sizeof(pinv)) ||
	    dccp_insert_option(sk, skb, TFRC_OPT_RECEIVE_RATE,
		    	       &x_recv, sizeof(x_recv)))
		return -1;

	return 0;
776 777 778 779 780 781 782 783
}

/* calculate first loss interval
 *
 * returns estimated loss interval in usecs */

static u32 ccid3_hc_rx_calc_first_li(struct sock *sk)
{
784
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
785
	struct dccp_rx_hist_entry *entry, *next, *tail = NULL;
786
	u32 rtt, delta, x_recv, fval, p, tmp2;
787
	struct timeval tstamp = { 0, };
788 789 790 791 792
	int interval = 0;
	int win_count = 0;
	int step = 0;
	u64 tmp1;

793 794 795
	list_for_each_entry_safe(entry, next, &hcrx->ccid3hcrx_hist,
				 dccphrx_node) {
		if (dccp_rx_hist_entry_data_packet(entry)) {
796 797 798 799
			tail = entry;

			switch (step) {
			case 0:
800
				tstamp	  = entry->dccphrx_tstamp;
801
				win_count = entry->dccphrx_ccval;
802 803 804
				step = 1;
				break;
			case 1:
805
				interval = win_count - entry->dccphrx_ccval;
806 807 808 809 810 811 812 813 814
				if (interval < 0)
					interval += TFRC_WIN_COUNT_LIMIT;
				if (interval > 4)
					goto found;
				break;
			}
		}
	}

815
	if (unlikely(step == 0)) {
816 817
		DCCP_WARN("%s, sk=%p, packet history has no data packets!\n",
			  dccp_role(sk), sk);
818 819 820
		return ~0;
	}

821
	if (unlikely(interval == 0)) {
822 823
		DCCP_WARN("%s, sk=%p, Could not find a win_count interval > 0."
			  "Defaulting to 1\n", dccp_role(sk), sk);
824 825 826
		interval = 1;
	}
found:
I
Ian McDonald 已提交
827
	if (!tail) {
828
		DCCP_CRIT("tail is null\n");
I
Ian McDonald 已提交
829 830
		return ~0;
	}
831
	rtt = timeval_delta(&tstamp, &tail->dccphrx_tstamp) * 4 / interval;
832 833
	ccid3_pr_debug("%s, sk=%p, approximated RTT to %uus\n",
		       dccp_role(sk), sk, rtt);
834 835 836 837 838

	if (rtt == 0) {
		DCCP_WARN("RTT==0, setting to 1\n");
 		rtt = 1;
	}
839

840 841 842
	dccp_timestamp(sk, &tstamp);
	delta = timeval_delta(&tstamp, &hcrx->ccid3hcrx_tstamp_last_feedback);
	x_recv = usecs_div(hcrx->ccid3hcrx_bytes_recv, delta);
843

I
Ian McDonald 已提交
844 845 846
	if (x_recv == 0)
		x_recv = hcrx->ccid3hcrx_x_recv;

847 848 849
	tmp1 = (u64)x_recv * (u64)rtt;
	do_div(tmp1,10000000);
	tmp2 = (u32)tmp1;
I
Ian McDonald 已提交
850 851

	if (!tmp2) {
852
		DCCP_CRIT("tmp2 = 0, x_recv = %u, rtt =%u\n", x_recv, rtt);
I
Ian McDonald 已提交
853 854 855
		return ~0;
	}

856 857
	fval = (hcrx->ccid3hcrx_s * 100000) / tmp2;
	/* do not alter order above or you will get overflow on 32 bit */
858
	p = tfrc_calc_x_reverse_lookup(fval);
859 860
	ccid3_pr_debug("%s, sk=%p, receive rate=%u bytes/s, implied "
		       "loss rate=%u\n", dccp_role(sk), sk, x_recv, p);
861 862 863 864 865 866 867 868 869

	if (p == 0)
		return ~0;
	else
		return 1000000 / p; 
}

static void ccid3_hc_rx_update_li(struct sock *sk, u64 seq_loss, u8 win_loss)
{
870
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
871
	struct dccp_li_hist_entry *head;
I
Ian McDonald 已提交
872
	u64 seq_temp;
873

I
Ian McDonald 已提交
874 875 876 877
	if (list_empty(&hcrx->ccid3hcrx_li_hist)) {
		if (!dccp_li_hist_interval_new(ccid3_li_hist,
		   &hcrx->ccid3hcrx_li_hist, seq_loss, win_loss))
			return;
878

879 880 881
		head = list_entry(hcrx->ccid3hcrx_li_hist.next,
		   struct dccp_li_hist_entry, dccplih_node);
		head->dccplih_interval = ccid3_hc_rx_calc_first_li(sk);
I
Ian McDonald 已提交
882 883 884 885
	} else {
		struct dccp_li_hist_entry *entry;
		struct list_head *tail;

886 887
		head = list_entry(hcrx->ccid3hcrx_li_hist.next,
		   struct dccp_li_hist_entry, dccplih_node);
I
Ian McDonald 已提交
888 889 890 891 892 893 894 895 896 897
		/* FIXME win count check removed as was wrong */
		/* should make this check with receive history */
		/* and compare there as per section 10.2 of RFC4342 */

		/* new loss event detected */
		/* calculate last interval length */
		seq_temp = dccp_delta_seqno(head->dccplih_seqno, seq_loss);
		entry = dccp_li_hist_entry_new(ccid3_li_hist, SLAB_ATOMIC);

		if (entry == NULL) {
898
			DCCP_BUG("out of memory - can not allocate entry");
899
			return;
I
Ian McDonald 已提交
900 901 902 903 904 905 906 907 908 909 910 911 912
		}

		list_add(&entry->dccplih_node, &hcrx->ccid3hcrx_li_hist);

		tail = hcrx->ccid3hcrx_li_hist.prev;
		list_del(tail);
		kmem_cache_free(ccid3_li_hist->dccplih_slab, tail);

		/* Create the newest interval */
		entry->dccplih_seqno = seq_loss;
		entry->dccplih_interval = seq_temp;
		entry->dccplih_win_count = win_loss;
	}
913 914
}

I
Ian McDonald 已提交
915 916
static int ccid3_hc_rx_detect_loss(struct sock *sk,
                                    struct dccp_rx_hist_entry *packet)
917
{
918
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
I
Ian McDonald 已提交
919 920 921 922 923 924 925 926 927 928 929 930 931 932 933 934
	struct dccp_rx_hist_entry *rx_hist = dccp_rx_hist_head(&hcrx->ccid3hcrx_hist);
	u64 seqno = packet->dccphrx_seqno;
	u64 tmp_seqno;
	int loss = 0;
	u8 ccval;


	tmp_seqno = hcrx->ccid3hcrx_seqno_nonloss;

	if (!rx_hist ||
	   follows48(packet->dccphrx_seqno, hcrx->ccid3hcrx_seqno_nonloss)) {
		hcrx->ccid3hcrx_seqno_nonloss = seqno;
		hcrx->ccid3hcrx_ccval_nonloss = packet->dccphrx_ccval;
		goto detect_out;
	}

935

I
Ian McDonald 已提交
936 937 938 939 940 941 942 943 944 945 946 947 948 949 950 951 952 953 954 955 956 957 958 959 960 961 962 963 964
	while (dccp_delta_seqno(hcrx->ccid3hcrx_seqno_nonloss, seqno)
	   > TFRC_RECV_NUM_LATE_LOSS) {
		loss = 1;
		ccid3_hc_rx_update_li(sk, hcrx->ccid3hcrx_seqno_nonloss,
		   hcrx->ccid3hcrx_ccval_nonloss);
		tmp_seqno = hcrx->ccid3hcrx_seqno_nonloss;
		dccp_inc_seqno(&tmp_seqno);
		hcrx->ccid3hcrx_seqno_nonloss = tmp_seqno;
		dccp_inc_seqno(&tmp_seqno);
		while (dccp_rx_hist_find_entry(&hcrx->ccid3hcrx_hist,
		   tmp_seqno, &ccval)) {
		   	hcrx->ccid3hcrx_seqno_nonloss = tmp_seqno;
			hcrx->ccid3hcrx_ccval_nonloss = ccval;
			dccp_inc_seqno(&tmp_seqno);
		}
	}

	/* FIXME - this code could be simplified with above while */
	/* but works at moment */
	if (follows48(packet->dccphrx_seqno, hcrx->ccid3hcrx_seqno_nonloss)) {
		hcrx->ccid3hcrx_seqno_nonloss = seqno;
		hcrx->ccid3hcrx_ccval_nonloss = packet->dccphrx_ccval;
	}

detect_out:
	dccp_rx_hist_add_packet(ccid3_rx_hist, &hcrx->ccid3hcrx_hist,
		   &hcrx->ccid3hcrx_li_hist, packet,
		   hcrx->ccid3hcrx_seqno_nonloss);
	return loss;
965 966 967 968
}

static void ccid3_hc_rx_packet_recv(struct sock *sk, struct sk_buff *skb)
{
969
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
970
	const struct dccp_options_received *opt_recv;
971
	struct dccp_rx_hist_entry *packet;
972
	struct timeval now;
I
Ian McDonald 已提交
973 974
	u32 p_prev, rtt_prev, r_sample, t_elapsed;
	int loss;
975

976
	BUG_ON(hcrx == NULL);
977

978
	opt_recv = &dccp_sk(sk)->dccps_options_received;
979

980 981 982 983 984
	switch (DCCP_SKB_CB(skb)->dccpd_type) {
	case DCCP_PKT_ACK:
		if (hcrx->ccid3hcrx_state == TFRC_RSTATE_NO_DATA)
			return;
	case DCCP_PKT_DATAACK:
985
		if (opt_recv->dccpor_timestamp_echo == 0)
986
			break;
I
Ian McDonald 已提交
987
		rtt_prev = hcrx->ccid3hcrx_rtt;
988
		dccp_timestamp(sk, &now);
989 990 991 992 993
		timeval_sub_usecs(&now, opt_recv->dccpor_timestamp_echo * 10);
		r_sample = timeval_usecs(&now);
		t_elapsed = opt_recv->dccpor_elapsed_time * 10;

		if (unlikely(r_sample <= t_elapsed))
994 995
			DCCP_WARN("r_sample=%uus, t_elapsed=%uus\n",
				  r_sample, t_elapsed);
996 997 998 999 1000 1001 1002 1003 1004
		else
			r_sample -= t_elapsed;

		if (hcrx->ccid3hcrx_state == TFRC_RSTATE_NO_DATA)
			hcrx->ccid3hcrx_rtt = r_sample;
		else
			hcrx->ccid3hcrx_rtt = (hcrx->ccid3hcrx_rtt * 9) / 10 +
					      r_sample / 10;

I
Ian McDonald 已提交
1005 1006
		if (rtt_prev != hcrx->ccid3hcrx_rtt)
			ccid3_pr_debug("%s, New RTT=%uus, elapsed time=%u\n",
1007 1008
				       dccp_role(sk), hcrx->ccid3hcrx_rtt,
				       opt_recv->dccpor_elapsed_time);
1009 1010 1011
		break;
	case DCCP_PKT_DATA:
		break;
1012
	default: /* We're not interested in other packet types, move along */
1013 1014 1015
		return;
	}

1016
	packet = dccp_rx_hist_entry_new(ccid3_rx_hist, sk, opt_recv->dccpor_ndp,
1017
					skb, SLAB_ATOMIC);
1018
	if (unlikely(packet == NULL)) {
1019 1020
		DCCP_WARN("%s, sk=%p, Not enough mem to add rx packet "
			  "to history, consider it lost!\n", dccp_role(sk), sk);
1021 1022 1023
		return;
	}

I
Ian McDonald 已提交
1024
	loss = ccid3_hc_rx_detect_loss(sk, packet);
1025 1026 1027 1028 1029 1030

	if (DCCP_SKB_CB(skb)->dccpd_type == DCCP_PKT_ACK)
		return;

	switch (hcrx->ccid3hcrx_state) {
	case TFRC_RSTATE_NO_DATA:
1031 1032 1033 1034
		ccid3_pr_debug("%s, sk=%p(%s), skb=%p, sending initial "
			       "feedback\n",
			       dccp_role(sk), sk,
			       dccp_state_name(sk->sk_state), skb);
1035 1036 1037 1038
		ccid3_hc_rx_send_feedback(sk);
		ccid3_hc_rx_set_state(sk, TFRC_RSTATE_DATA);
		return;
	case TFRC_RSTATE_DATA:
1039 1040
		hcrx->ccid3hcrx_bytes_recv += skb->len -
					      dccp_hdr(skb)->dccph_doff * 4;
I
Ian McDonald 已提交
1041
		if (loss)
1042 1043
			break;

1044
		dccp_timestamp(sk, &now);
1045 1046 1047 1048
		if (timeval_delta(&now, &hcrx->ccid3hcrx_tstamp_last_ack) >=
		    hcrx->ccid3hcrx_rtt) {
			hcrx->ccid3hcrx_tstamp_last_ack = now;
			ccid3_hc_rx_send_feedback(sk);
1049
		}
1050
		return;
1051 1052
	case TFRC_RSTATE_TERM:
		DCCP_BUG("Illegal %s state TERM, sk=%p", dccp_role(sk), sk);
1053 1054 1055 1056
		return;
	}

	/* Dealing with packet loss */
1057 1058
	ccid3_pr_debug("%s, sk=%p(%s), data loss! Reacting...\n",
		       dccp_role(sk), sk, dccp_state_name(sk->sk_state));
1059 1060 1061 1062

	p_prev = hcrx->ccid3hcrx_p;
	
	/* Calculate loss event rate */
I
Ian McDonald 已提交
1063 1064 1065
	if (!list_empty(&hcrx->ccid3hcrx_li_hist)) {
		u32 i_mean = dccp_li_hist_calc_i_mean(&hcrx->ccid3hcrx_li_hist);

1066
		/* Scaling up by 1000000 as fixed decimal */
I
Ian McDonald 已提交
1067 1068
		if (i_mean != 0)
			hcrx->ccid3hcrx_p = 1000000 / i_mean;
1069 1070
	} else
		DCCP_BUG("empty loss history");
1071 1072 1073 1074 1075 1076 1077

	if (hcrx->ccid3hcrx_p > p_prev) {
		ccid3_hc_rx_send_feedback(sk);
		return;
	}
}

1078
static int ccid3_hc_rx_init(struct ccid *ccid, struct sock *sk)
1079 1080
{
	struct dccp_sock *dp = dccp_sk(sk);
1081
	struct ccid3_hc_rx_sock *hcrx = ccid_priv(ccid);
1082 1083 1084

	ccid3_pr_debug("%s, sk=%p\n", dccp_role(sk), sk);

1085 1086 1087
	if (dp->dccps_packet_size >= TFRC_MIN_PACKET_SIZE &&
	    dp->dccps_packet_size <= TFRC_MAX_PACKET_SIZE)
		hcrx->ccid3hcrx_s = dp->dccps_packet_size;
1088 1089 1090 1091 1092
	else
		hcrx->ccid3hcrx_s = TFRC_STD_PACKET_SIZE;

	hcrx->ccid3hcrx_state = TFRC_RSTATE_NO_DATA;
	INIT_LIST_HEAD(&hcrx->ccid3hcrx_hist);
1093
	INIT_LIST_HEAD(&hcrx->ccid3hcrx_li_hist);
1094
	dccp_timestamp(sk, &hcrx->ccid3hcrx_tstamp_last_ack);
1095 1096
	hcrx->ccid3hcrx_tstamp_last_feedback = hcrx->ccid3hcrx_tstamp_last_ack;
	hcrx->ccid3hcrx_rtt = 5000; /* XXX 5ms for now... */
1097 1098 1099 1100 1101
	return 0;
}

static void ccid3_hc_rx_exit(struct sock *sk)
{
1102
	struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
1103

1104
	BUG_ON(hcrx == NULL);
1105 1106 1107 1108

	ccid3_hc_rx_set_state(sk, TFRC_RSTATE_TERM);

	/* Empty packet history */
1109
	dccp_rx_hist_purge(ccid3_rx_hist, &hcrx->ccid3hcrx_hist);
1110 1111

	/* Empty loss interval history */
1112
	dccp_li_hist_purge(ccid3_li_hist, &hcrx->ccid3hcrx_li_hist);
1113 1114
}

1115 1116
static void ccid3_hc_rx_get_info(struct sock *sk, struct tcp_info *info)
{
1117
	const struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
1118

1119 1120 1121 1122
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return;

1123
	BUG_ON(hcrx == NULL);
1124 1125 1126 1127 1128 1129 1130 1131

	info->tcpi_ca_state	= hcrx->ccid3hcrx_state;
	info->tcpi_options	|= TCPI_OPT_TIMESTAMPS;
	info->tcpi_rcv_rtt	= hcrx->ccid3hcrx_rtt;
}

static void ccid3_hc_tx_get_info(struct sock *sk, struct tcp_info *info)
{
1132
	const struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
1133

1134 1135 1136 1137
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return;

1138
	BUG_ON(hctx == NULL);
1139 1140 1141 1142 1143

	info->tcpi_rto = hctx->ccid3hctx_t_rto;
	info->tcpi_rtt = hctx->ccid3hctx_rtt;
}

1144 1145 1146 1147 1148 1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173 1174 1175 1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197
static int ccid3_hc_rx_getsockopt(struct sock *sk, const int optname, int len,
				  u32 __user *optval, int __user *optlen)
{
	const struct ccid3_hc_rx_sock *hcrx = ccid3_hc_rx_sk(sk);
	const void *val;
	
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return -EINVAL;

	switch (optname) {
	case DCCP_SOCKOPT_CCID_RX_INFO:
		if (len < sizeof(hcrx->ccid3hcrx_tfrc))
			return -EINVAL;
		len = sizeof(hcrx->ccid3hcrx_tfrc);
		val = &hcrx->ccid3hcrx_tfrc;
		break;
	default:
		return -ENOPROTOOPT;
	}

	if (put_user(len, optlen) || copy_to_user(optval, val, len))
		return -EFAULT;

	return 0;
}

static int ccid3_hc_tx_getsockopt(struct sock *sk, const int optname, int len,
				  u32 __user *optval, int __user *optlen)
{
	const struct ccid3_hc_tx_sock *hctx = ccid3_hc_tx_sk(sk);
	const void *val;
	
	/* Listen socks doesn't have a private CCID block */
	if (sk->sk_state == DCCP_LISTEN)
		return -EINVAL;

	switch (optname) {
	case DCCP_SOCKOPT_CCID_TX_INFO:
		if (len < sizeof(hctx->ccid3hctx_tfrc))
			return -EINVAL;
		len = sizeof(hctx->ccid3hctx_tfrc);
		val = &hctx->ccid3hctx_tfrc;
		break;
	default:
		return -ENOPROTOOPT;
	}

	if (put_user(len, optlen) || copy_to_user(optval, val, len))
		return -EFAULT;

	return 0;
}

1198
static struct ccid_operations ccid3 = {
I
Ian McDonald 已提交
1199
	.ccid_id		   = DCCPC_CCID3,
1200 1201
	.ccid_name		   = "ccid3",
	.ccid_owner		   = THIS_MODULE,
1202
	.ccid_hc_tx_obj_size	   = sizeof(struct ccid3_hc_tx_sock),
1203 1204 1205 1206 1207 1208 1209
	.ccid_hc_tx_init	   = ccid3_hc_tx_init,
	.ccid_hc_tx_exit	   = ccid3_hc_tx_exit,
	.ccid_hc_tx_send_packet	   = ccid3_hc_tx_send_packet,
	.ccid_hc_tx_packet_sent	   = ccid3_hc_tx_packet_sent,
	.ccid_hc_tx_packet_recv	   = ccid3_hc_tx_packet_recv,
	.ccid_hc_tx_insert_options = ccid3_hc_tx_insert_options,
	.ccid_hc_tx_parse_options  = ccid3_hc_tx_parse_options,
1210
	.ccid_hc_rx_obj_size	   = sizeof(struct ccid3_hc_rx_sock),
1211 1212 1213 1214
	.ccid_hc_rx_init	   = ccid3_hc_rx_init,
	.ccid_hc_rx_exit	   = ccid3_hc_rx_exit,
	.ccid_hc_rx_insert_options = ccid3_hc_rx_insert_options,
	.ccid_hc_rx_packet_recv	   = ccid3_hc_rx_packet_recv,
1215 1216
	.ccid_hc_rx_get_info	   = ccid3_hc_rx_get_info,
	.ccid_hc_tx_get_info	   = ccid3_hc_tx_get_info,
1217 1218
	.ccid_hc_rx_getsockopt	   = ccid3_hc_rx_getsockopt,
	.ccid_hc_tx_getsockopt	   = ccid3_hc_tx_getsockopt,
1219 1220
};
 
1221
#ifdef CONFIG_IP_DCCP_CCID3_DEBUG
1222 1223
module_param(ccid3_debug, int, 0444);
MODULE_PARM_DESC(ccid3_debug, "Enable debug messages");
1224
#endif
1225 1226 1227

static __init int ccid3_module_init(void)
{
1228
	int rc = -ENOBUFS;
1229

1230 1231
	ccid3_rx_hist = dccp_rx_hist_new("ccid3");
	if (ccid3_rx_hist == NULL)
1232 1233
		goto out;

1234 1235 1236
	ccid3_tx_hist = dccp_tx_hist_new("ccid3");
	if (ccid3_tx_hist == NULL)
		goto out_free_rx;
1237

1238 1239
	ccid3_li_hist = dccp_li_hist_new("ccid3");
	if (ccid3_li_hist == NULL)
1240
		goto out_free_tx;
1241 1242 1243 1244 1245 1246

	rc = ccid_register(&ccid3);
	if (rc != 0) 
		goto out_free_loss_interval_history;
out:
	return rc;
1247

1248
out_free_loss_interval_history:
1249 1250
	dccp_li_hist_delete(ccid3_li_hist);
	ccid3_li_hist = NULL;
1251 1252 1253 1254 1255 1256
out_free_tx:
	dccp_tx_hist_delete(ccid3_tx_hist);
	ccid3_tx_hist = NULL;
out_free_rx:
	dccp_rx_hist_delete(ccid3_rx_hist);
	ccid3_rx_hist = NULL;
1257 1258 1259 1260 1261 1262 1263 1264
	goto out;
}
module_init(ccid3_module_init);

static __exit void ccid3_module_exit(void)
{
	ccid_unregister(&ccid3);

1265 1266 1267
	if (ccid3_tx_hist != NULL) {
		dccp_tx_hist_delete(ccid3_tx_hist);
		ccid3_tx_hist = NULL;
1268
	}
1269 1270 1271
	if (ccid3_rx_hist != NULL) {
		dccp_rx_hist_delete(ccid3_rx_hist);
		ccid3_rx_hist = NULL;
1272
	}
1273 1274 1275
	if (ccid3_li_hist != NULL) {
		dccp_li_hist_delete(ccid3_li_hist);
		ccid3_li_hist = NULL;
1276 1277 1278 1279
	}
}
module_exit(ccid3_module_exit);

1280
MODULE_AUTHOR("Ian McDonald <ian.mcdonald@jandi.co.nz>, "
1281
	      "Arnaldo Carvalho de Melo <acme@ghostprotocols.net>");
1282 1283 1284
MODULE_DESCRIPTION("DCCP TFRC CCID3 CCID");
MODULE_LICENSE("GPL");
MODULE_ALIAS("net-dccp-ccid-3");