/*
 * Copyright (c) 2009-2010 Chelsio, Inc. All rights reserved.
 *
 * This software is available to you under a choice of one of two
 * licenses.  You may choose to be licensed under the terms of the GNU
 * General Public License (GPL) Version 2, available from the file
 * COPYING in the main directory of this source tree, or the
 * OpenIB.org BSD license below:
 *
 *     Redistribution and use in source and binary forms, with or
 *     without modification, are permitted provided that the following
 *     conditions are met:
 *
 *      - Redistributions of source code must retain the above
 *	  copyright notice, this list of conditions and the following
 *	  disclaimer.
 *
 *      - Redistributions in binary form must reproduce the above
 *	  copyright notice, this list of conditions and the following
 *	  disclaimer in the documentation and/or other materials
 *	  provided with the distribution.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 */

#include "iw_cxgb4.h"

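/*
 * Tear down a hardware CQ: post a FW_RI_RES_WR with the RESET opcode,
 * wait for the firmware reply, then free the software queue, the DMA
 * memory and the cqid.
 */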
static int destroy_cq(struct c4iw_rdev *rdev, struct t4_cq *cq,
		      struct c4iw_dev_ucontext *uctx, struct sk_buff *skb,
		      struct c4iw_wr_wait *wr_waitp)
{
	struct fw_ri_res_wr *res_wr;
	struct fw_ri_res *res;
	int wr_len;
	int ret;

	wr_len = sizeof *res_wr + sizeof *res;
	set_wr_txq(skb, CPL_PRIORITY_CONTROL, 0);

	res_wr = __skb_put_zero(skb, wr_len);
	res_wr->op_nres = cpu_to_be32(
			FW_WR_OP_V(FW_RI_RES_WR) |
			FW_RI_RES_WR_NRES_V(1) |
			FW_WR_COMPL_F);
	res_wr->len16_pkd = cpu_to_be32(DIV_ROUND_UP(wr_len, 16));
	res_wr->cookie = (uintptr_t)wr_waitp;
	res = res_wr->res;
	res->u.cq.restype = FW_RI_RES_TYPE_CQ;
	res->u.cq.op = FW_RI_RES_OP_RESET;
	res->u.cq.iqid = cpu_to_be32(cq->cqid);

	c4iw_init_wr_wait(wr_waitp);
	ret = c4iw_ref_send_wait(rdev, skb, wr_waitp, 0, 0, __func__);

	kfree(cq->sw_queue);
	dma_free_coherent(&(rdev->lldi.pdev->dev),
			  cq->memsize, cq->queue,
			  dma_unmap_addr(cq, mapping));
	c4iw_put_cqid(rdev, cq->cqid, uctx);
	return ret;
}

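/*
 * Create a hardware CQ: allocate a cqid and the queue memory, then post
 * a FW_RI_RES_WR with the WRITE opcode so the firmware instantiates the
 * ingress queue, and map its BAR2 doorbell area.
 */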
static int create_cq(struct c4iw_rdev *rdev, struct t4_cq *cq,
		     struct c4iw_dev_ucontext *uctx,
		     struct c4iw_wr_wait *wr_waitp)
{
	struct fw_ri_res_wr *res_wr;
	struct fw_ri_res *res;
	int wr_len;
	int user = (uctx != &rdev->uctx);
	int ret;
	struct sk_buff *skb;
	struct c4iw_ucontext *ucontext = NULL;

	if (user)
		ucontext = container_of(uctx, struct c4iw_ucontext, uctx);

	cq->cqid = c4iw_get_cqid(rdev, uctx);
	if (!cq->cqid) {
		ret = -ENOMEM;
		goto err1;
	}

	if (!user) {
		cq->sw_queue = kzalloc(cq->memsize, GFP_KERNEL);
		if (!cq->sw_queue) {
			ret = -ENOMEM;
			goto err2;
		}
	}
	cq->queue = dma_alloc_coherent(&rdev->lldi.pdev->dev, cq->memsize,
				       &cq->dma_addr, GFP_KERNEL);
	if (!cq->queue) {
		ret = -ENOMEM;
		goto err3;
	}
	dma_unmap_addr_set(cq, mapping, cq->dma_addr);
	memset(cq->queue, 0, cq->memsize);

	if (user && ucontext->is_32b_cqe) {
		cq->qp_errp = &((struct t4_status_page *)
		((u8 *)cq->queue + (cq->size - 1) *
		 (sizeof(*cq->queue) / 2)))->qp_err;
	} else {
		cq->qp_errp = &((struct t4_status_page *)
		((u8 *)cq->queue + (cq->size - 1) *
		 sizeof(*cq->queue)))->qp_err;
	}

	/* build fw_ri_res_wr */
	wr_len = sizeof *res_wr + sizeof *res;

	skb = alloc_skb(wr_len, GFP_KERNEL);
	if (!skb) {
		ret = -ENOMEM;
		goto err4;
	}
	set_wr_txq(skb, CPL_PRIORITY_CONTROL, 0);

	res_wr = __skb_put_zero(skb, wr_len);
	res_wr->op_nres = cpu_to_be32(
			FW_WR_OP_V(FW_RI_RES_WR) |
			FW_RI_RES_WR_NRES_V(1) |
			FW_WR_COMPL_F);
	res_wr->len16_pkd = cpu_to_be32(DIV_ROUND_UP(wr_len, 16));
	res_wr->cookie = (uintptr_t)wr_waitp;
	res = res_wr->res;
	res->u.cq.restype = FW_RI_RES_TYPE_CQ;
	res->u.cq.op = FW_RI_RES_OP_WRITE;
	res->u.cq.iqid = cpu_to_be32(cq->cqid);
	res->u.cq.iqandst_to_iqandstindex = cpu_to_be32(
			FW_RI_RES_WR_IQANUS_V(0) |
			FW_RI_RES_WR_IQANUD_V(1) |
			FW_RI_RES_WR_IQANDST_F |
			FW_RI_RES_WR_IQANDSTINDEX_V(
				rdev->lldi.ciq_ids[cq->vector]));
	res->u.cq.iqdroprss_to_iqesize = cpu_to_be16(
			FW_RI_RES_WR_IQDROPRSS_F |
			FW_RI_RES_WR_IQPCIECH_V(2) |
			FW_RI_RES_WR_IQINTCNTTHRESH_V(0) |
			FW_RI_RES_WR_IQO_F |
			((user && ucontext->is_32b_cqe) ?
			 FW_RI_RES_WR_IQESIZE_V(1) :
			 FW_RI_RES_WR_IQESIZE_V(2)));
	res->u.cq.iqsize = cpu_to_be16(cq->size);
	res->u.cq.iqaddr = cpu_to_be64(cq->dma_addr);

	c4iw_init_wr_wait(wr_waitp);
	ret = c4iw_ref_send_wait(rdev, skb, wr_waitp, 0, 0, __func__);
	if (ret)
		goto err4;

	cq->gen = 1;
	cq->gts = rdev->lldi.gts_reg;
	cq->rdev = rdev;

	cq->bar2_va = c4iw_bar2_addrs(rdev, cq->cqid, CXGB4_BAR2_QTYPE_INGRESS,
				      &cq->bar2_qid,
				      user ? &cq->bar2_pa : NULL);
	if (user && !cq->bar2_pa) {
		pr_warn("%s: cqid %u not in BAR2 range\n",
			pci_name(rdev->lldi.pdev), cq->cqid);
		ret = -EINVAL;
		goto err4;
	}
	return 0;
err4:
	dma_free_coherent(&rdev->lldi.pdev->dev, cq->memsize, cq->queue,
			  dma_unmap_addr(cq, mapping));
err3:
	kfree(cq->sw_queue);
err2:
	c4iw_put_cqid(rdev, cq->cqid, uctx);
err1:
	return ret;
}

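/* Insert a software-generated flush CQE for an RQ (or SRQ) work request. */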
static void insert_recv_cqe(struct t4_wq *wq, struct t4_cq *cq, u32 srqidx)
{
	struct t4_cqe cqe;

	pr_debug("wq %p cq %p sw_cidx %u sw_pidx %u\n",
		 wq, cq, cq->sw_cidx, cq->sw_pidx);
	memset(&cqe, 0, sizeof(cqe));
	cqe.header = cpu_to_be32(CQE_STATUS_V(T4_ERR_SWFLUSH) |
				 CQE_OPCODE_V(FW_RI_SEND) |
				 CQE_TYPE_V(0) |
				 CQE_SWCQE_V(1) |
				 CQE_QPID_V(wq->sq.qid));
	cqe.bits_type_ts = cpu_to_be64(CQE_GENBIT_V((u64)cq->gen));
	if (srqidx)
		cqe.u.srcqe.abs_rqe_idx = cpu_to_be32(srqidx);
	cq->sw_queue[cq->sw_pidx] = cqe;
	t4_swcq_produce(cq);
}

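/* Flush the in-use RQ entries, less the skip count, into the software CQ. */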
int c4iw_flush_rq(struct t4_wq *wq, struct t4_cq *cq, int count)
{
	int flushed = 0;
	int in_use = wq->rq.in_use - count;

	pr_debug("wq %p cq %p rq.in_use %u skip count %u\n",
		 wq, cq, wq->rq.in_use, count);
	while (in_use--) {
		insert_recv_cqe(wq, cq, 0);
		flushed++;
	}
	return flushed;
}

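/* Insert a software-generated flush CQE for an SQ work request. */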
static void insert_sq_cqe(struct t4_wq *wq, struct t4_cq *cq,
			  struct t4_swsqe *swcqe)
{
	struct t4_cqe cqe;

	pr_debug("wq %p cq %p sw_cidx %u sw_pidx %u\n",
		 wq, cq, cq->sw_cidx, cq->sw_pidx);
	memset(&cqe, 0, sizeof(cqe));
	cqe.header = cpu_to_be32(CQE_STATUS_V(T4_ERR_SWFLUSH) |
				 CQE_OPCODE_V(swcqe->opcode) |
				 CQE_TYPE_V(1) |
				 CQE_SWCQE_V(1) |
				 CQE_QPID_V(wq->sq.qid));
	CQE_WRID_SQ_IDX(&cqe) = swcqe->idx;
	cqe.bits_type_ts = cpu_to_be64(CQE_GENBIT_V((u64)cq->gen));
	cq->sw_queue[cq->sw_pidx] = cqe;
	t4_swcq_produce(cq);
}

static void advance_oldest_read(struct t4_wq *wq);

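/* Flush the pending SQ work requests into the software CQ as flush CQEs. */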
int c4iw_flush_sq(struct c4iw_qp *qhp)
{
	int flushed = 0;
	struct t4_wq *wq = &qhp->wq;
	struct c4iw_cq *chp = to_c4iw_cq(qhp->ibqp.send_cq);
	struct t4_cq *cq = &chp->cq;
	int idx;
	struct t4_swsqe *swsqe;

	if (wq->sq.flush_cidx == -1)
		wq->sq.flush_cidx = wq->sq.cidx;
	idx = wq->sq.flush_cidx;
	while (idx != wq->sq.pidx) {
		swsqe = &wq->sq.sw_sq[idx];
		swsqe->flushed = 1;
		insert_sq_cqe(wq, cq, swsqe);
		if (wq->sq.oldest_read == swsqe) {
			advance_oldest_read(wq);
		}
		flushed++;
		if (++idx == wq->sq.size)
			idx = 0;
	}
	wq->sq.flush_cidx += flushed;
	if (wq->sq.flush_cidx >= wq->sq.size)
		wq->sq.flush_cidx -= wq->sq.size;
	return flushed;
}

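/*
 * Walk the SQ in order and move completed, signaled CQEs into the
 * software CQ, skipping over unsignaled work requests and stopping at
 * the first signaled entry that has not yet completed.
 */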
static void flush_completed_wrs(struct t4_wq *wq, struct t4_cq *cq)
{
	struct t4_swsqe *swsqe;
	int cidx;

	if (wq->sq.flush_cidx == -1)
		wq->sq.flush_cidx = wq->sq.cidx;
	cidx = wq->sq.flush_cidx;

	while (cidx != wq->sq.pidx) {
		swsqe = &wq->sq.sw_sq[cidx];
		if (!swsqe->signaled) {
			if (++cidx == wq->sq.size)
				cidx = 0;
		} else if (swsqe->complete) {

			/*
			 * Insert this completed cqe into the swcq.
			 */
			pr_debug("moving cqe into swcq sq idx %u cq idx %u\n",
				 cidx, cq->sw_pidx);
			swsqe->cqe.header |= htonl(CQE_SWCQE_V(1));
			cq->sw_queue[cq->sw_pidx] = swsqe->cqe;
			t4_swcq_produce(cq);
			swsqe->flushed = 1;
			if (++cidx == wq->sq.size)
				cidx = 0;
			wq->sq.flush_cidx = cidx;
		} else
			break;
	}
}

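/* Rebuild an SQ-type READ_REQ CQE for the oldest read from an RQ-type READ_RESP hw_cqe. */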
static void create_read_req_cqe(struct t4_wq *wq, struct t4_cqe *hw_cqe,
		struct t4_cqe *read_cqe)
{
	read_cqe->u.scqe.cidx = wq->sq.oldest_read->idx;
	read_cqe->len = htonl(wq->sq.oldest_read->read_len);
	read_cqe->header = htonl(CQE_QPID_V(CQE_QPID(hw_cqe)) |
			CQE_SWCQE_V(SW_CQE(hw_cqe)) |
			CQE_OPCODE_V(FW_RI_READ_REQ) |
			CQE_TYPE_V(1));
	read_cqe->bits_type_ts = hw_cqe->bits_type_ts;
}

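/* Advance wq->sq.oldest_read to the next outstanding read request, if any. */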
static void advance_oldest_read(struct t4_wq *wq)
{

	u32 rptr = wq->sq.oldest_read - wq->sq.sw_sq + 1;

	if (rptr == wq->sq.size)
		rptr = 0;
	while (rptr != wq->sq.pidx) {
		wq->sq.oldest_read = &wq->sq.sw_sq[rptr];

		if (wq->sq.oldest_read->opcode == FW_RI_READ_REQ)
			return;
		if (++rptr == wq->sq.size)
			rptr = 0;
	}
	wq->sq.oldest_read = NULL;
}

/*
 * Move all CQEs from the HWCQ into the SWCQ.
 * Deal with out-of-order and/or completions that complete
 * prior unsignalled WRs.
 */
void c4iw_flush_hw_cq(struct c4iw_cq *chp, struct c4iw_qp *flush_qhp)
{
	struct t4_cqe *hw_cqe, *swcqe, read_cqe;
	struct c4iw_qp *qhp;
	struct t4_swsqe *swsqe;
	int ret;

	pr_debug("cqid 0x%x\n", chp->cq.cqid);
	ret = t4_next_hw_cqe(&chp->cq, &hw_cqe);

	/*
	 * This logic is similar to poll_cq(), but not quite the same
	 * unfortunately.  Need to move pertinent HW CQEs to the SW CQ but
	 * also do any translation magic that poll_cq() normally does.
	 */
	while (!ret) {
		qhp = get_qhp(chp->rhp, CQE_QPID(hw_cqe));

		/*
		 * drop CQEs with no associated QP
		 */
		if (qhp == NULL)
			goto next_cqe;

		if (flush_qhp != qhp) {
			spin_lock(&qhp->lock);

			if (qhp->wq.flushed == 1)
				goto next_cqe;
		}

		if (CQE_OPCODE(hw_cqe) == FW_RI_TERMINATE)
			goto next_cqe;

		if (CQE_OPCODE(hw_cqe) == FW_RI_READ_RESP) {

			/* If we have reached here because of async
			 * event or other error, and have egress error
			 * then drop
			 */
			if (CQE_TYPE(hw_cqe) == 1)
				goto next_cqe;

			/* drop peer2peer RTR reads.
			 */
			if (CQE_WRID_STAG(hw_cqe) == 1)
				goto next_cqe;

			/*
			 * Eat completions for unsignaled read WRs.
			 */
			if (!qhp->wq.sq.oldest_read->signaled) {
				advance_oldest_read(&qhp->wq);
				goto next_cqe;
			}

			/*
			 * Don't write to the HWCQ, create a new read req CQE
			 * in local memory and move it into the swcq.
			 */
			create_read_req_cqe(&qhp->wq, hw_cqe, &read_cqe);
			hw_cqe = &read_cqe;
			advance_oldest_read(&qhp->wq);
		}

		/* if it's a SQ completion, then do the magic to move all the
		 * unsignaled and now in-order completions into the swcq.
		 */
		if (SQ_TYPE(hw_cqe)) {
			swsqe = &qhp->wq.sq.sw_sq[CQE_WRID_SQ_IDX(hw_cqe)];
			swsqe->cqe = *hw_cqe;
			swsqe->complete = 1;
			flush_completed_wrs(&qhp->wq, &chp->cq);
		} else {
			swcqe = &chp->cq.sw_queue[chp->cq.sw_pidx];
			*swcqe = *hw_cqe;
			swcqe->header |= cpu_to_be32(CQE_SWCQE_V(1));
			t4_swcq_produce(&chp->cq);
		}
next_cqe:
		t4_hwcq_consume(&chp->cq);
		ret = t4_next_hw_cqe(&chp->cq, &hw_cqe);
		if (qhp && flush_qhp != qhp)
			spin_unlock(&qhp->lock);
	}
}

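/*
 * Return 1 if this CQE completes an outstanding work request on the wq,
 * 0 if it should be ignored when counting RQ completions.
 */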
static int cqe_completes_wr(struct t4_cqe *cqe, struct t4_wq *wq)
{
	if (DRAIN_CQE(cqe)) {
		WARN_ONCE(1, "Unexpected DRAIN CQE qp id %u!\n", wq->sq.qid);
		return 0;
	}

	if (CQE_OPCODE(cqe) == FW_RI_TERMINATE)
		return 0;

	if ((CQE_OPCODE(cqe) == FW_RI_RDMA_WRITE) && RQ_TYPE(cqe))
		return 0;

	if ((CQE_OPCODE(cqe) == FW_RI_READ_RESP) && SQ_TYPE(cqe))
		return 0;

	if (CQE_SEND_OPCODE(cqe) && RQ_TYPE(cqe) && t4_rq_empty(wq))
		return 0;
	return 1;
}

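/*
 * Count the software CQEs in the CQ that complete outstanding RQ work
 * requests for this wq.
 */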
void c4iw_count_rcqes(struct t4_cq *cq, struct t4_wq *wq, int *count)
{
	struct t4_cqe *cqe;
	u32 ptr;

	*count = 0;
	pr_debug("count zero %d\n", *count);
	ptr = cq->sw_cidx;
	while (ptr != cq->sw_pidx) {
		cqe = &cq->sw_queue[ptr];
		if (RQ_TYPE(cqe) && (CQE_OPCODE(cqe) != FW_RI_READ_RESP) &&
		    (CQE_QPID(cqe) == wq->sq.qid) && cqe_completes_wr(cqe, wq))
			(*count)++;
		if (++ptr == cq->size)
			ptr = 0;
	}
	pr_debug("cq %p count %d\n", cq, *count);
}

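/*
 * Post SRQ work requests that were deferred while out-of-order
 * completions were outstanding, then ring the SRQ doorbell.
 */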
static void post_pending_srq_wrs(struct t4_srq *srq)
{
	struct t4_srq_pending_wr *pwr;
	u16 idx = 0;

	while (srq->pending_in_use) {
		pwr = &srq->pending_wrs[srq->pending_cidx];
		srq->sw_rq[srq->pidx].wr_id = pwr->wr_id;
		srq->sw_rq[srq->pidx].valid = 1;

		pr_debug("%s posting pending cidx %u pidx %u wq_pidx %u in_use %u rq_size %u wr_id %llx\n",
			 __func__,
			 srq->cidx, srq->pidx, srq->wq_pidx,
			 srq->in_use, srq->size,
			 (unsigned long long)pwr->wr_id);

		c4iw_copy_wr_to_srq(srq, &pwr->wqe, pwr->len16);
		t4_srq_consume_pending_wr(srq);
		t4_srq_produce(srq, pwr->len16);
		idx += DIV_ROUND_UP(pwr->len16 * 16, T4_EQ_ENTRY_SIZE);
	}

	if (idx) {
		t4_ring_srq_db(srq, idx, pwr->len16, &pwr->wqe);
		srq->queue[srq->size].status.host_wq_pidx =
			srq->wq_pidx;
	}
}

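/*
 * Consume the SRQ entry referenced by this CQE, tracking out-of-order
 * completions, and return the wr_id of the completed work request.
 */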
static u64 reap_srq_cqe(struct t4_cqe *hw_cqe, struct t4_srq *srq)
{
	int rel_idx = CQE_ABS_RQE_IDX(hw_cqe) - srq->rqt_abs_idx;
	u64 wr_id;

	srq->sw_rq[rel_idx].valid = 0;
	wr_id = srq->sw_rq[rel_idx].wr_id;

	if (rel_idx == srq->cidx) {
		pr_debug("%s in order cqe rel_idx %u cidx %u pidx %u wq_pidx %u in_use %u rq_size %u wr_id %llx\n",
			 __func__, rel_idx, srq->cidx, srq->pidx,
			 srq->wq_pidx, srq->in_use, srq->size,
			 (unsigned long long)srq->sw_rq[rel_idx].wr_id);
		t4_srq_consume(srq);
		while (srq->ooo_count && !srq->sw_rq[srq->cidx].valid) {
			pr_debug("%s eat ooo cidx %u pidx %u wq_pidx %u in_use %u rq_size %u ooo_count %u wr_id %llx\n",
				 __func__, srq->cidx, srq->pidx,
				 srq->wq_pidx, srq->in_use,
				 srq->size, srq->ooo_count,
				 (unsigned long long)
				 srq->sw_rq[srq->cidx].wr_id);
			t4_srq_consume_ooo(srq);
		}
		if (srq->ooo_count == 0 && srq->pending_in_use)
			post_pending_srq_wrs(srq);
	} else {
		pr_debug("%s ooo cqe rel_idx %u cidx %u pidx %u wq_pidx %u in_use %u rq_size %u ooo_count %u wr_id %llx\n",
			 __func__, rel_idx, srq->cidx,
			 srq->pidx, srq->wq_pidx,
			 srq->in_use, srq->size,
			 srq->ooo_count,
			 (unsigned long long)srq->sw_rq[rel_idx].wr_id);
		t4_srq_produce_ooo(srq);
	}
	return wr_id;
}

/*
 * poll_cq
 *
 * Caller must:
 *     check the validity of the first CQE,
 *     supply the wq associated with the qpid.
 *
 * credit: cq credit to return to sge.
 * cqe_flushed: 1 iff the CQE is flushed.
 * cqe: copy of the polled CQE.
 *
 * return value:
 *    0		    CQE returned ok.
 *    -EAGAIN       CQE skipped, try again.
 *    -EOVERFLOW    CQ overflow detected.
 */
static int poll_cq(struct t4_wq *wq, struct t4_cq *cq, struct t4_cqe *cqe,
		   u8 *cqe_flushed, u64 *cookie, u32 *credit,
		   struct t4_srq *srq)
{
	int ret = 0;
	struct t4_cqe *hw_cqe, read_cqe;

	*cqe_flushed = 0;
	*credit = 0;
	ret = t4_next_cqe(cq, &hw_cqe);
	if (ret)
		return ret;

	pr_debug("CQE OVF %u qpid 0x%0x genbit %u type %u status 0x%0x opcode 0x%0x len 0x%0x wrid_hi_stag 0x%x wrid_low_msn 0x%x\n",
		 CQE_OVFBIT(hw_cqe), CQE_QPID(hw_cqe),
		 CQE_GENBIT(hw_cqe), CQE_TYPE(hw_cqe), CQE_STATUS(hw_cqe),
		 CQE_OPCODE(hw_cqe), CQE_LEN(hw_cqe), CQE_WRID_HI(hw_cqe),
		 CQE_WRID_LOW(hw_cqe));

	/*
	 * skip cqe's not affiliated with a QP.
	 */
	if (wq == NULL) {
		ret = -EAGAIN;
		goto skip_cqe;
	}

	/*
	 * skip hw cqe's if the wq is flushed.
	 */
	if (wq->flushed && !SW_CQE(hw_cqe)) {
		ret = -EAGAIN;
		goto skip_cqe;
	}

	/*
	 * skip TERMINATE cqes...
	 */
	if (CQE_OPCODE(hw_cqe) == FW_RI_TERMINATE) {
		ret = -EAGAIN;
		goto skip_cqe;
	}

	/*
	 * Special cqe for drain WR completions...
	 */
	if (DRAIN_CQE(hw_cqe)) {
		*cookie = CQE_DRAIN_COOKIE(hw_cqe);
		*cqe = *hw_cqe;
		goto skip_cqe;
	}

	/*
	 * Gotta tweak READ completions:
	 *	1) the cqe doesn't contain the sq_wptr from the wr.
	 *	2) opcode not reflected from the wr.
	 *	3) read_len not reflected from the wr.
	 *	4) cq_type is RQ_TYPE not SQ_TYPE.
	 */
	if (RQ_TYPE(hw_cqe) && (CQE_OPCODE(hw_cqe) == FW_RI_READ_RESP)) {

		/* If we have reached here because of async
		 * event or other error, and have egress error
		 * then drop
		 */
		if (CQE_TYPE(hw_cqe) == 1) {
			if (CQE_STATUS(hw_cqe))
				t4_set_wq_in_error(wq, 0);
			ret = -EAGAIN;
			goto skip_cqe;
		}

		/* If this is an unsolicited read response, then the read
		 * was generated by the kernel driver as part of peer-2-peer
		 * connection setup.  So ignore the completion.
		 */
		if (CQE_WRID_STAG(hw_cqe) == 1) {
			if (CQE_STATUS(hw_cqe))
				t4_set_wq_in_error(wq, 0);
			ret = -EAGAIN;
			goto skip_cqe;
		}

		/*
		 * Eat completions for unsignaled read WRs.
		 */
		if (!wq->sq.oldest_read->signaled) {
			advance_oldest_read(wq);
			ret = -EAGAIN;
			goto skip_cqe;
		}

		/*
		 * Don't write to the HWCQ, so create a new read req CQE
		 * in local memory.
		 */
		create_read_req_cqe(wq, hw_cqe, &read_cqe);
		hw_cqe = &read_cqe;
		advance_oldest_read(wq);
	}

	if (CQE_STATUS(hw_cqe) || t4_wq_in_error(wq)) {
		*cqe_flushed = (CQE_STATUS(hw_cqe) == T4_ERR_SWFLUSH);
		t4_set_wq_in_error(wq, 0);
	}

	/*
	 * RECV completion.
	 */
	if (RQ_TYPE(hw_cqe)) {

		/*
		 * HW only validates 4 bits of MSN.  So we must validate that
		 * the MSN in the SEND is the next expected MSN.  If its not,
		 * then we complete this with T4_ERR_MSN and mark the wq in
		 * error.
		 */
		if (unlikely(!CQE_STATUS(hw_cqe) &&
			     CQE_WRID_MSN(hw_cqe) != wq->rq.msn)) {
			t4_set_wq_in_error(wq, 0);
			hw_cqe->header |= cpu_to_be32(CQE_STATUS_V(T4_ERR_MSN));
		}
		goto proc_cqe;
	}

	/*
	 * If we get here it's a send completion.
	 *
	 * Handle out of order completion. These get stuffed
	 * in the SW SQ. Then the SW SQ is walked to move any
	 * now in-order completions into the SW CQ.  This handles
	 * 2 cases:
	 *	1) reaping unsignaled WRs when the first subsequent
	 *	   signaled WR is completed.
	 *	2) out of order read completions.
	 */
	if (!SW_CQE(hw_cqe) && (CQE_WRID_SQ_IDX(hw_cqe) != wq->sq.cidx)) {
		struct t4_swsqe *swsqe;

		pr_debug("out of order completion going in sw_sq at idx %u\n",
			 CQE_WRID_SQ_IDX(hw_cqe));
		swsqe = &wq->sq.sw_sq[CQE_WRID_SQ_IDX(hw_cqe)];
		swsqe->cqe = *hw_cqe;
		swsqe->complete = 1;
		ret = -EAGAIN;
		goto flush_wq;
	}

proc_cqe:
	*cqe = *hw_cqe;

	/*
	 * Reap the associated WR(s) that are freed up with this
	 * completion.
	 */
	if (SQ_TYPE(hw_cqe)) {
		int idx = CQE_WRID_SQ_IDX(hw_cqe);

		/*
		 * Account for any unsignaled completions completed by
		 * this signaled completion.  In this case, cidx points
		 * to the first unsignaled one, and idx points to the
		 * signaled one.  So adjust in_use based on this delta.
		 * If this is not completing any unsignaled wrs, then the
		 * delta will be 0. Handle wrapping also!
		 */
		if (idx < wq->sq.cidx)
			wq->sq.in_use -= wq->sq.size + idx - wq->sq.cidx;
		else
			wq->sq.in_use -= idx - wq->sq.cidx;

		wq->sq.cidx = (uint16_t)idx;
		pr_debug("completing sq idx %u\n", wq->sq.cidx);
		*cookie = wq->sq.sw_sq[wq->sq.cidx].wr_id;
		if (c4iw_wr_log)
			c4iw_log_wr_stats(wq, hw_cqe);
		t4_sq_consume(wq);
	} else {
		if (!srq) {
			pr_debug("completing rq idx %u\n", wq->rq.cidx);
			*cookie = wq->rq.sw_rq[wq->rq.cidx].wr_id;
			if (c4iw_wr_log)
				c4iw_log_wr_stats(wq, hw_cqe);
			t4_rq_consume(wq);
		} else {
			*cookie = reap_srq_cqe(hw_cqe, srq);
		}
		wq->rq.msn++;
		goto skip_cqe;
	}

flush_wq:
	/*
	 * Flush any completed cqes that are now in-order.
	 */
	flush_completed_wrs(wq, cq);

skip_cqe:
	if (SW_CQE(hw_cqe)) {
		pr_debug("cq %p cqid 0x%x skip sw cqe cidx %u\n",
			 cq, cq->cqid, cq->sw_cidx);
		t4_swcq_consume(cq);
	} else {
		pr_debug("cq %p cqid 0x%x skip hw cqe cidx %u\n",
			 cq, cq->cqid, cq->cidx);
		t4_hwcq_consume(cq);
	}
	return ret;
}

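/*
 * Poll one CQE off the CQ and map it to an ib_wc.  The caller holds the
 * qhp lock (and the srq lock, if any) whenever a QP is associated.
 */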
static int __c4iw_poll_cq_one(struct c4iw_cq *chp, struct c4iw_qp *qhp,
			      struct ib_wc *wc, struct c4iw_srq *srq)
{
	struct t4_cqe uninitialized_var(cqe);
	struct t4_wq *wq = qhp ? &qhp->wq : NULL;
	u32 credit = 0;
	u8 cqe_flushed;
	u64 cookie = 0;
	int ret;

	ret = poll_cq(wq, &(chp->cq), &cqe, &cqe_flushed, &cookie, &credit,
		      srq ? &srq->wq : NULL);
	if (ret)
		goto out;

	wc->wr_id = cookie;
	wc->qp = qhp ? &qhp->ibqp : NULL;
	wc->vendor_err = CQE_STATUS(&cqe);
	wc->wc_flags = 0;

	/*
	 * Simulate a SRQ_LIMIT_REACHED HW notification if required.
	 */
	if (srq && !(srq->flags & T4_SRQ_LIMIT_SUPPORT) && srq->armed &&
	    srq->wq.in_use < srq->srq_limit)
		c4iw_dispatch_srq_limit_reached_event(srq);

	pr_debug("qpid 0x%x type %d opcode %d status 0x%x len %u wrid hi 0x%x lo 0x%x cookie 0x%llx\n",
		 CQE_QPID(&cqe),
		 CQE_TYPE(&cqe), CQE_OPCODE(&cqe),
		 CQE_STATUS(&cqe), CQE_LEN(&cqe),
		 CQE_WRID_HI(&cqe), CQE_WRID_LOW(&cqe),
		 (unsigned long long)cookie);

	if (CQE_TYPE(&cqe) == 0) {
		if (!CQE_STATUS(&cqe))
			wc->byte_len = CQE_LEN(&cqe);
		else
			wc->byte_len = 0;
794 795 796 797 798 799 800 801

		switch (CQE_OPCODE(&cqe)) {
		case FW_RI_SEND:
			wc->opcode = IB_WC_RECV;
			break;
		case FW_RI_SEND_WITH_INV:
		case FW_RI_SEND_WITH_SE_INV:
			wc->opcode = IB_WC_RECV;
802 803
			wc->ex.invalidate_rkey = CQE_WRID_STAG(&cqe);
			wc->wc_flags |= IB_WC_WITH_INVALIDATE;
804
			c4iw_invalidate_mr(qhp->rhp, wc->ex.invalidate_rkey);
805 806 807 808 809 810 811 812 813 814 815
			break;
		case FW_RI_WRITE_IMMEDIATE:
			wc->opcode = IB_WC_RECV_RDMA_WITH_IMM;
			wc->ex.imm_data = CQE_IMM_DATA(&cqe);
			wc->wc_flags |= IB_WC_WITH_IMM;
			break;
		default:
			pr_err("Unexpected opcode %d in the CQE received for QPID=0x%0x\n",
			       CQE_OPCODE(&cqe), CQE_QPID(&cqe));
			ret = -EINVAL;
			goto out;
816 817 818
		}
	} else {
		switch (CQE_OPCODE(&cqe)) {
		case FW_RI_WRITE_IMMEDIATE:
		case FW_RI_RDMA_WRITE:
			wc->opcode = IB_WC_RDMA_WRITE;
			break;
		case FW_RI_READ_REQ:
			wc->opcode = IB_WC_RDMA_READ;
			wc->byte_len = CQE_LEN(&cqe);
			break;
		case FW_RI_SEND_WITH_INV:
		case FW_RI_SEND_WITH_SE_INV:
			wc->opcode = IB_WC_SEND;
			wc->wc_flags |= IB_WC_WITH_INVALIDATE;
			break;
		case FW_RI_SEND:
		case FW_RI_SEND_WITH_SE:
			wc->opcode = IB_WC_SEND;
			break;

		case FW_RI_LOCAL_INV:
			wc->opcode = IB_WC_LOCAL_INV;
			break;
		case FW_RI_FAST_REGISTER:
			wc->opcode = IB_WC_REG_MR;

			/* Invalidate the MR if the fastreg failed */
			if (CQE_STATUS(&cqe) != T4_ERR_SUCCESS)
845 846
				c4iw_invalidate_mr(qhp->rhp,
						   CQE_WRID_FR_STAG(&cqe));
847 848
			break;
		default:
849
			pr_err("Unexpected opcode %d in the CQE received for QPID=0x%0x\n",
850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884 885 886 887 888 889 890 891 892 893 894 895 896
			       CQE_OPCODE(&cqe), CQE_QPID(&cqe));
			ret = -EINVAL;
			goto out;
		}
	}

	if (cqe_flushed)
		wc->status = IB_WC_WR_FLUSH_ERR;
	else {

		switch (CQE_STATUS(&cqe)) {
		case T4_ERR_SUCCESS:
			wc->status = IB_WC_SUCCESS;
			break;
		case T4_ERR_STAG:
			wc->status = IB_WC_LOC_ACCESS_ERR;
			break;
		case T4_ERR_PDID:
			wc->status = IB_WC_LOC_PROT_ERR;
			break;
		case T4_ERR_QPID:
		case T4_ERR_ACCESS:
			wc->status = IB_WC_LOC_ACCESS_ERR;
			break;
		case T4_ERR_WRAP:
			wc->status = IB_WC_GENERAL_ERR;
			break;
		case T4_ERR_BOUND:
			wc->status = IB_WC_LOC_LEN_ERR;
			break;
		case T4_ERR_INVALIDATE_SHARED_MR:
		case T4_ERR_INVALIDATE_MR_WITH_MW_BOUND:
			wc->status = IB_WC_MW_BIND_ERR;
			break;
		case T4_ERR_CRC:
		case T4_ERR_MARKER:
		case T4_ERR_PDU_LEN_ERR:
		case T4_ERR_OUT_OF_RQE:
		case T4_ERR_DDP_VERSION:
		case T4_ERR_RDMA_VERSION:
		case T4_ERR_DDP_QUEUE_NUM:
		case T4_ERR_MSN:
		case T4_ERR_TBIT:
		case T4_ERR_MO:
		case T4_ERR_MSN_RANGE:
		case T4_ERR_IRD_OVERFLOW:
		case T4_ERR_OPCODE:
		case T4_ERR_INTERNAL_ERR:
			wc->status = IB_WC_FATAL_ERR;
			break;
		case T4_ERR_SWFLUSH:
			wc->status = IB_WC_WR_FLUSH_ERR;
			break;
		default:
			pr_err("Unexpected cqe_status 0x%x for QPID=0x%0x\n",
			       CQE_STATUS(&cqe), CQE_QPID(&cqe));
			wc->status = IB_WC_FATAL_ERR;
		}
	}
out:
	return ret;
}

/*
 * Get one cq entry from c4iw and map it to openib.
 *
 * Returns:
 *	0			cqe returned
 *	-ENODATA		EMPTY;
 *	-EAGAIN			caller must try again
 *	any other -errno	fatal error
 */
static int c4iw_poll_cq_one(struct c4iw_cq *chp, struct ib_wc *wc)
{
	struct c4iw_srq *srq = NULL;
	struct c4iw_qp *qhp = NULL;
	struct t4_cqe *rd_cqe;
	int ret;

	ret = t4_next_cqe(&chp->cq, &rd_cqe);

	if (ret)
		return ret;

	qhp = get_qhp(chp->rhp, CQE_QPID(rd_cqe));
	if (qhp) {
		spin_lock(&qhp->lock);
		srq = qhp->srq;
		if (srq)
			spin_lock(&srq->lock);
		ret = __c4iw_poll_cq_one(chp, qhp, wc, srq);
		spin_unlock(&qhp->lock);
		if (srq)
			spin_unlock(&srq->lock);
	} else {
		ret = __c4iw_poll_cq_one(chp, NULL, wc, NULL);
	}
	return ret;
}

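/* Poll up to num_entries completions off the CQ while holding the CQ lock. */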
int c4iw_poll_cq(struct ib_cq *ibcq, int num_entries, struct ib_wc *wc)
{
	struct c4iw_cq *chp;
	unsigned long flags;
	int npolled;
	int err = 0;

	chp = to_c4iw_cq(ibcq);

	spin_lock_irqsave(&chp->lock, flags);
	for (npolled = 0; npolled < num_entries; ++npolled) {
		do {
			err = c4iw_poll_cq_one(chp, wc + npolled);
		} while (err == -EAGAIN);
		if (err)
			break;
	}
	spin_unlock_irqrestore(&chp->lock, flags);
	return !err || err == -ENODATA ? npolled : err;
}

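/* Destroy a CQ: wait for all references to drop, then free the hardware queue. */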
int c4iw_destroy_cq(struct ib_cq *ib_cq)
{
	struct c4iw_cq *chp;
	struct c4iw_ucontext *ucontext;

	pr_debug("ib_cq %p\n", ib_cq);
	chp = to_c4iw_cq(ib_cq);

	remove_handle(chp->rhp, &chp->rhp->cqidr, chp->cq.cqid);
	atomic_dec(&chp->refcnt);
	wait_event(chp->wait, !atomic_read(&chp->refcnt));

	ucontext = ib_cq->uobject ? to_c4iw_ucontext(ib_cq->uobject->context)
				  : NULL;
	destroy_cq(&chp->rhp->rdev, &chp->cq,
		   ucontext ? &ucontext->uctx : &chp->cq.rdev->uctx,
		   chp->destroy_skb, chp->wr_waitp);
	c4iw_put_wr_wait(chp->wr_waitp);
	kfree(chp);
	return 0;
}

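/*
 * Create a CQ for the verbs consumer: size the hardware ingress queue,
 * create it in firmware, and for user CQs set up the mmap entries for
 * the queue memory and the BAR2/GTS page.
 */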
struct ib_cq *c4iw_create_cq(struct ib_device *ibdev,
			     const struct ib_cq_init_attr *attr,
			     struct ib_ucontext *ib_context,
			     struct ib_udata *udata)
{
	int entries = attr->cqe;
	int vector = attr->comp_vector;
	struct c4iw_dev *rhp;
	struct c4iw_cq *chp;
	struct c4iw_create_cq ucmd;
	struct c4iw_create_cq_resp uresp;
	struct c4iw_ucontext *ucontext = NULL;
	int ret, wr_len;
	size_t memsize, hwentries;
	struct c4iw_mm_entry *mm, *mm2;

	pr_debug("ib_dev %p entries %d\n", ibdev, entries);
	if (attr->flags)
		return ERR_PTR(-EINVAL);

	rhp = to_c4iw_dev(ibdev);

	if (vector >= rhp->rdev.lldi.nciq)
		return ERR_PTR(-EINVAL);

	if (ib_context) {
		ucontext = to_c4iw_ucontext(ib_context);
		if (udata->inlen < sizeof(ucmd))
			ucontext->is_32b_cqe = 1;
	}

	chp = kzalloc(sizeof(*chp), GFP_KERNEL);
	if (!chp)
		return ERR_PTR(-ENOMEM);

	chp->wr_waitp = c4iw_alloc_wr_wait(GFP_KERNEL);
	if (!chp->wr_waitp) {
		ret = -ENOMEM;
		goto err_free_chp;
	}
	c4iw_init_wr_wait(chp->wr_waitp);

	wr_len = sizeof(struct fw_ri_res_wr) + sizeof(struct fw_ri_res);
	chp->destroy_skb = alloc_skb(wr_len, GFP_KERNEL);
	if (!chp->destroy_skb) {
		ret = -ENOMEM;
		goto err_free_wr_wait;
	}

	/* account for the status page. */
	entries++;

	/* IQ needs one extra entry to differentiate full vs empty. */
	entries++;

	/*
	 * entries must be multiple of 16 for HW.
	 */
	entries = roundup(entries, 16);

	/*
	 * Make actual HW queue 2x to avoid cidx_inc overflows.
	 */
	hwentries = min(entries * 2, rhp->rdev.hw_queue.t4_max_iq_size);

	/*
	 * Make HW queue at least 64 entries so GTS updates aren't too
	 * frequent.
	 */
	if (hwentries < 64)
		hwentries = 64;

	memsize = hwentries * ((ucontext && ucontext->is_32b_cqe) ?
			(sizeof(*chp->cq.queue) / 2) : sizeof(*chp->cq.queue));

	/*
	 * memsize must be a multiple of the page size if it's a user cq.
	 */
	if (ucontext)
		memsize = roundup(memsize, PAGE_SIZE);

	chp->cq.size = hwentries;
	chp->cq.memsize = memsize;
	chp->cq.vector = vector;

	ret = create_cq(&rhp->rdev, &chp->cq,
			ucontext ? &ucontext->uctx : &rhp->rdev.uctx,
			chp->wr_waitp);
	if (ret)
		goto err_free_skb;

	chp->rhp = rhp;
	chp->cq.size--;				/* status page */
	chp->ibcq.cqe = entries - 2;
	spin_lock_init(&chp->lock);
	spin_lock_init(&chp->comp_handler_lock);
	atomic_set(&chp->refcnt, 1);
	init_waitqueue_head(&chp->wait);
	ret = insert_handle(rhp, &rhp->cqidr, chp, chp->cq.cqid);
	if (ret)
		goto err_destroy_cq;

	if (ucontext) {
		ret = -ENOMEM;
		mm = kmalloc(sizeof *mm, GFP_KERNEL);
		if (!mm)
			goto err_remove_handle;
		mm2 = kmalloc(sizeof *mm2, GFP_KERNEL);
		if (!mm2)
			goto err_free_mm;

		memset(&uresp, 0, sizeof(uresp));
		uresp.qid_mask = rhp->rdev.cqmask;
		uresp.cqid = chp->cq.cqid;
		uresp.size = chp->cq.size;
		uresp.memsize = chp->cq.memsize;
		spin_lock(&ucontext->mmap_lock);
		uresp.key = ucontext->key;
		ucontext->key += PAGE_SIZE;
		uresp.gts_key = ucontext->key;
		ucontext->key += PAGE_SIZE;
		/* communicate to the userspace that
		 * kernel driver supports 64B CQE
		 */
		uresp.flags |= C4IW_64B_CQE;

		spin_unlock(&ucontext->mmap_lock);
		ret = ib_copy_to_udata(udata, &uresp,
				       ucontext->is_32b_cqe ?
				       sizeof(uresp) - sizeof(uresp.flags) :
				       sizeof(uresp));
		if (ret)
			goto err_free_mm2;

		mm->key = uresp.key;
		mm->addr = virt_to_phys(chp->cq.queue);
		mm->len = chp->cq.memsize;
		insert_mmap(ucontext, mm);

		mm2->key = uresp.gts_key;
		mm2->addr = chp->cq.bar2_pa;
		mm2->len = PAGE_SIZE;
		insert_mmap(ucontext, mm2);
	}
	pr_debug("cqid 0x%0x chp %p size %u memsize %zu, dma_addr 0x%0llx\n",
		 chp->cq.cqid, chp, chp->cq.size,
		 chp->cq.memsize, (unsigned long long)chp->cq.dma_addr);
	return &chp->ibcq;
err_free_mm2:
	kfree(mm2);
err_free_mm:
	kfree(mm);
err_remove_handle:
	remove_handle(rhp, &rhp->cqidr, chp->cq.cqid);
err_destroy_cq:
	destroy_cq(&chp->rhp->rdev, &chp->cq,
		   ucontext ? &ucontext->uctx : &rhp->rdev.uctx,
		   chp->destroy_skb, chp->wr_waitp);
err_free_skb:
	kfree_skb(chp->destroy_skb);
err_free_wr_wait:
	c4iw_put_wr_wait(chp->wr_waitp);
err_free_chp:
	kfree(chp);
	return ERR_PTR(ret);
}

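/*
 * Arm the CQ for the next notification; with IB_CQ_REPORT_MISSED_EVENTS,
 * return whether the CQ is non-empty.
 */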
int c4iw_arm_cq(struct ib_cq *ibcq, enum ib_cq_notify_flags flags)
{
	struct c4iw_cq *chp;
	int ret = 0;
	unsigned long flag;

	chp = to_c4iw_cq(ibcq);
	spin_lock_irqsave(&chp->lock, flag);
	t4_arm_cq(&chp->cq,
		  (flags & IB_CQ_SOLICITED_MASK) == IB_CQ_SOLICITED);
	if (flags & IB_CQ_REPORT_MISSED_EVENTS)
		ret = t4_cq_notempty(&chp->cq);
	spin_unlock_irqrestore(&chp->lock, flag);
	return ret;
}

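/* Insert a flush CQE for the given SRQ index into the QP's receive CQ. */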
void c4iw_flush_srqidx(struct c4iw_qp *qhp, u32 srqidx)
{
	struct c4iw_cq *rchp = to_c4iw_cq(qhp->ibqp.recv_cq);
	unsigned long flag;

	/* locking hierarchy: cq lock first, then qp lock. */
	spin_lock_irqsave(&rchp->lock, flag);
	spin_lock(&qhp->lock);

	/* create a SRQ RECV CQE for srqidx */
	insert_recv_cqe(&qhp->wq, &rchp->cq, srqidx);

	spin_unlock(&qhp->lock);
	spin_unlock_irqrestore(&rchp->lock, flag);
}