Linux Audio

Check our new training course

Loading...
v6.8
  1// SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause
  2/*
  3 * Copyright(c) 2015 - 2018 Intel Corporation.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
  4 */
  5
  6#include "hfi.h"
  7#include "verbs_txreq.h"
  8#include "qp.h"
  9
 10/*
    * Cut down ridiculously long IB macro names: OP(x) is shorthand for
    * UC_OP(x) everywhere below.
    */
 11#define OP(x) UC_OP(x)
 12
 13/**
 14 * hfi1_make_uc_req - construct a request packet (SEND, RDMA write)
 15 * @qp: a pointer to the QP
 16 * @ps: the current packet state
 17 *
    * Obtains a txreq with get_txreq() and, driven by qp->s_state, either
    * starts the send WQE at qp->s_cur or continues a multi-packet message.
    * At most one packet, carrying no more than qp->pmtu payload bytes, is
    * prepared per call.
    *
 18 * Assume s_lock is held.
 19 *
 20 * Return 1 if constructed; otherwise, return 0.
    * 1 is also returned, with ps->s_txreq set to NULL, when a WQE was
    * completed without building a packet (a flush while the QP cannot
    * send, or a local REG_MR/LOCAL_INV operation).  On a 0 return
    * ps->s_txreq is NULL and RVT_S_BUSY has been cleared in qp->s_flags.
 21 */
 22int hfi1_make_uc_req(struct rvt_qp *qp, struct hfi1_pkt_state *ps)
 23{
 24	struct hfi1_qp_priv *priv = qp->priv;
 25	struct ib_other_headers *ohdr;
 26	struct rvt_swqe *wqe;
 27	u32 hwords;
 28	u32 bth0 = 0;
 29	u32 len;
 30	u32 pmtu = qp->pmtu;
 31	int middle = 0;
 32
 33	ps->s_txreq = get_txreq(ps->dev, qp);
 34	if (!ps->s_txreq)
 35		goto bail_no_tx;
 36
 37	if (!(ib_rvt_state_ops[qp->state] & RVT_PROCESS_SEND_OK)) {
 38		if (!(ib_rvt_state_ops[qp->state] & RVT_FLUSH_SEND))
 39			goto bail;
 40		/* We are in the error state, flush the work request. */
 41		if (qp->s_last == READ_ONCE(qp->s_head))
 42			goto bail;
 43		/* If DMAs are in progress, we can't flush immediately. */
 44		if (iowait_sdma_pending(&priv->s_iowait)) {
 45			qp->s_flags |= RVT_S_WAIT_DMA;
 46			goto bail;
 47		}
 48		clear_ahg(qp);
   		/* Flush one WQE per call, oldest (s_last) first. */
 49		wqe = rvt_get_swqe_ptr(qp, qp->s_last);
 50		rvt_send_complete(qp, wqe, IB_WC_WR_FLUSH_ERR);
 51		goto done_free_tx;
 52	}
 53
   	/*
   	 * Select where the "other headers" live inside the txreq for the
   	 * 9B or 16B header layout, and start hwords at the LRH+BTH size.
   	 */
 54	if (priv->hdr_type == HFI1_PKT_TYPE_9B) {
 55		/* header size in 32-bit words LRH+BTH = (8+12)/4. */
 56		hwords = 5;
 57		if (rdma_ah_get_ah_flags(&qp->remote_ah_attr) & IB_AH_GRH)
 58			ohdr = &ps->s_txreq->phdr.hdr.ibh.u.l.oth;
 59		else
 60			ohdr = &ps->s_txreq->phdr.hdr.ibh.u.oth;
 61	} else {
 62		/* header size in 32-bit words 16B LRH+BTH = (16+12)/4. */
 63		hwords = 7;
 64		if ((rdma_ah_get_ah_flags(&qp->remote_ah_attr) & IB_AH_GRH) &&
 65		    (hfi1_check_mcast(rdma_ah_get_dlid(&qp->remote_ah_attr))))
 66			ohdr = &ps->s_txreq->phdr.hdr.opah.u.l.oth;
 67		else
 68			ohdr = &ps->s_txreq->phdr.hdr.opah.u.oth;
 69	}
 70
 71	/* Get the next send request. */
 72	wqe = rvt_get_swqe_ptr(qp, qp->s_cur);
 73	qp->s_wqe = NULL;
 74	switch (qp->s_state) {
   	/* Any state other than FIRST/MIDDLE: begin the WQE at s_cur. */
 75	default:
 76		if (!(ib_rvt_state_ops[qp->state] &
 77		    RVT_PROCESS_NEXT_SEND_OK))
 78			goto bail;
 79		/* Check if send work queue is empty. */
 80		if (qp->s_cur == READ_ONCE(qp->s_head)) {
 81			clear_ahg(qp);
 82			goto bail;
 83		}
 84		/*
 85		 * Local operations are processed immediately
 86		 * after all prior requests have completed.
 87		 */
 88		if (wqe->wr.opcode == IB_WR_REG_MR ||
 89		    wqe->wr.opcode == IB_WR_LOCAL_INV) {
 90			int local_ops = 0;
 91			int err = 0;
 92
   			/* Prior requests are still outstanding; retry later. */
 93			if (qp->s_last != qp->s_cur)
 94				goto bail;
 95			if (++qp->s_cur == qp->s_size)
 96				qp->s_cur = 0;
 97			if (!(wqe->wr.send_flags & RVT_SEND_COMPLETION_ONLY)) {
 98				err = rvt_invalidate_rkey(
 99					qp, wqe->wr.ex.invalidate_rkey);
100				local_ops = 1;
101			}
102			rvt_send_complete(qp, wqe, err ? IB_WC_LOC_PROT_ERR
103							: IB_WC_SUCCESS);
104			if (local_ops)
105				atomic_dec(&qp->local_ops_pending);
106			goto done_free_tx;
107		}
108		/*
109		 * Start a new request.
110		 */
111		qp->s_psn = wqe->psn;
112		qp->s_sge.sge = wqe->sg_list[0];
113		qp->s_sge.sg_list = wqe->sg_list + 1;
114		qp->s_sge.num_sge = wqe->wr.num_sge;
115		qp->s_sge.total_len = wqe->length;
116		len = wqe->length;
117		qp->s_len = len;
118		switch (wqe->wr.opcode) {
119		case IB_WR_SEND:
120		case IB_WR_SEND_WITH_IMM:
   			/*
   			 * Larger than one PMTU: send the FIRST packet now and
   			 * leave s_cur on this WQE until its LAST packet.
   			 */
121			if (len > pmtu) {
122				qp->s_state = OP(SEND_FIRST);
123				len = pmtu;
124				break;
125			}
126			if (wqe->wr.opcode == IB_WR_SEND) {
127				qp->s_state = OP(SEND_ONLY);
128			} else {
129				qp->s_state =
130					OP(SEND_ONLY_WITH_IMMEDIATE);
131				/* Immediate data comes after the BTH */
132				ohdr->u.imm_data = wqe->wr.ex.imm_data;
133				hwords += 1;
134			}
135			if (wqe->wr.send_flags & IB_SEND_SOLICITED)
136				bth0 |= IB_BTH_SOLICITED;
137			qp->s_wqe = wqe;
138			if (++qp->s_cur >= qp->s_size)
139				qp->s_cur = 0;
140			break;
141
142		case IB_WR_RDMA_WRITE:
143		case IB_WR_RDMA_WRITE_WITH_IMM:
   			/* The RETH carries the full message length, not this packet's. */
144			ohdr->u.rc.reth.vaddr =
145				cpu_to_be64(wqe->rdma_wr.remote_addr);
146			ohdr->u.rc.reth.rkey =
147				cpu_to_be32(wqe->rdma_wr.rkey);
148			ohdr->u.rc.reth.length = cpu_to_be32(len);
149			hwords += sizeof(struct ib_reth) / 4;
150			if (len > pmtu) {
151				qp->s_state = OP(RDMA_WRITE_FIRST);
152				len = pmtu;
153				break;
154			}
155			if (wqe->wr.opcode == IB_WR_RDMA_WRITE) {
156				qp->s_state = OP(RDMA_WRITE_ONLY);
157			} else {
158				qp->s_state =
159					OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE);
160				/* Immediate data comes after the RETH */
161				ohdr->u.rc.imm_data = wqe->wr.ex.imm_data;
162				hwords += 1;
   				/* Solicited bit is only set when immediate data is sent. */
163				if (wqe->wr.send_flags & IB_SEND_SOLICITED)
164					bth0 |= IB_BTH_SOLICITED;
165			}
166			qp->s_wqe = wqe;
167			if (++qp->s_cur >= qp->s_size)
168				qp->s_cur = 0;
169			break;
170
171		default:
172			goto bail;
173		}
174		break;
175
176	case OP(SEND_FIRST):
177		qp->s_state = OP(SEND_MIDDLE);
178		fallthrough;
179	case OP(SEND_MIDDLE):
   		/* s_len is the number of bytes of this message still unsent. */
180		len = qp->s_len;
181		if (len > pmtu) {
182			len = pmtu;
   			/*
   			 * middle is handed to hfi1_make_ruc_header() below.
   			 * NOTE(review): presumably lets AHG reuse the header
   			 * for middle packets; confirm against that helper.
   			 */
183			middle = HFI1_CAP_IS_KSET(SDMA_AHG);
184			break;
185		}
186		if (wqe->wr.opcode == IB_WR_SEND) {
187			qp->s_state = OP(SEND_LAST);
188		} else {
189			qp->s_state = OP(SEND_LAST_WITH_IMMEDIATE);
190			/* Immediate data comes after the BTH */
191			ohdr->u.imm_data = wqe->wr.ex.imm_data;
192			hwords += 1;
193		}
194		if (wqe->wr.send_flags & IB_SEND_SOLICITED)
195			bth0 |= IB_BTH_SOLICITED;
196		qp->s_wqe = wqe;
197		if (++qp->s_cur >= qp->s_size)
198			qp->s_cur = 0;
199		break;
200
201	case OP(RDMA_WRITE_FIRST):
202		qp->s_state = OP(RDMA_WRITE_MIDDLE);
203		fallthrough;
204	case OP(RDMA_WRITE_MIDDLE):
205		len = qp->s_len;
206		if (len > pmtu) {
207			len = pmtu;
208			middle = HFI1_CAP_IS_KSET(SDMA_AHG);
209			break;
210		}
211		if (wqe->wr.opcode == IB_WR_RDMA_WRITE) {
212			qp->s_state = OP(RDMA_WRITE_LAST);
213		} else {
214			qp->s_state =
215				OP(RDMA_WRITE_LAST_WITH_IMMEDIATE);
216			/* Immediate data comes after the BTH */
217			ohdr->u.imm_data = wqe->wr.ex.imm_data;
218			hwords += 1;
219			if (wqe->wr.send_flags & IB_SEND_SOLICITED)
220				bth0 |= IB_BTH_SOLICITED;
221		}
222		qp->s_wqe = wqe;
223		if (++qp->s_cur >= qp->s_size)
224			qp->s_cur = 0;
225		break;
226	}
   	/*
   	 * Common tail for every path that produced a packet: account for the
   	 * payload bytes, describe the packet in the txreq and build the
   	 * header.  The new s_state is placed in bits 31:24 of the bth0
   	 * argument, and s_psn is post-incremented for the next packet.
   	 */
227	qp->s_len -= len;
228	ps->s_txreq->hdr_dwords = hwords;
229	ps->s_txreq->sde = priv->s_sde;
230	ps->s_txreq->ss = &qp->s_sge;
231	ps->s_txreq->s_cur_size = len;
232	hfi1_make_ruc_header(qp, ohdr, bth0 | (qp->s_state << 24),
233			     qp->remote_qpn, mask_psn(qp->s_psn++),
234			     middle, ps);
235	return 1;
236
   /* A WQE was completed without a packet: drop the txreq, still report 1. */
237done_free_tx:
238	hfi1_put_txreq(ps->s_txreq);
239	ps->s_txreq = NULL;
240	return 1;
241
   /* Nothing to send: release the txreq (if one was obtained) and clear BUSY. */
242bail:
243	hfi1_put_txreq(ps->s_txreq);
244
245bail_no_tx:
246	ps->s_txreq = NULL;
247	qp->s_flags &= ~RVT_S_BUSY;
248	return 0;
249}
250
251/**
252 * hfi1_uc_rcv - handle an incoming UC packet
253 * @packet: the packet structure
254 *
255 * This is called from qp_rcv() to process an incoming UC packet
256 * for the given QP.
257 * Called at interrupt level.
    *
    * The packet is silently ignored when hfi1_ruc_check_hdr() rejects it.
    * A PSN mismatch resynchronises qp->r_psn to the packet's PSN and
    * abandons any message in progress; processing then continues only if
    * the packet starts a new message (a FIRST or ONLY opcode).  Packets
    * that fail an opcode-sequence, length, access or rkey check are
    * dropped and counted in ibp->rvp.n_pkt_drops.  A negative return from
    * rvt_get_rwqe() puts the QP in error through
    * rvt_rc_error(qp, IB_WC_LOC_QP_OP_ERR).
    *
    * All length checks use extra_bytes (pad + packet->extra_byte + CRC),
    * the same quantity later subtracted from tlen, so the unsigned
    * payload length cannot wrap.
258 */
259void hfi1_uc_rcv(struct hfi1_packet *packet)
260{
261	struct hfi1_ibport *ibp = rcd_to_iport(packet->rcd);
262	void *data = packet->payload;
263	u32 tlen = packet->tlen;
264	struct rvt_qp *qp = packet->qp;
265	struct ib_other_headers *ohdr = packet->ohdr;
266	u32 opcode = packet->opcode;
267	u32 hdrsize = packet->hlen;
268	u32 psn;
269	u32 pad = packet->pad;
270	struct ib_wc wc;
271	u32 pmtu = qp->pmtu;
272	struct ib_reth *reth;
273	int ret;
   	/* Non-payload bytes that follow the headers: pad, extra byte, CRC. */
274	u8 extra_bytes = pad + packet->extra_byte + (SIZE_OF_CRC << 2);
275
276	if (hfi1_ruc_check_hdr(ibp, packet))
277		return;
278
279	process_ecn(qp, packet);
280
281	psn = ib_bth_get_psn(ohdr);
282	/* Compare the PSN versus the expected PSN. */
283	if (unlikely(cmp_psn(psn, qp->r_psn) != 0)) {
284		/*
285		 * Handle a sequence error.
286		 * Silently drop any current message.
287		 */
288		qp->r_psn = psn;
289inv:
   		/*
   		 * An interrupted SEND keeps its RWQE for reuse (REWIND_SGE);
   		 * anything else just releases the r_sge references.
   		 */
290		if (qp->r_state == OP(SEND_FIRST) ||
291		    qp->r_state == OP(SEND_MIDDLE)) {
292			set_bit(RVT_R_REWIND_SGE, &qp->r_aflags);
293			qp->r_sge.num_sge = 0;
294		} else {
295			rvt_put_ss(&qp->r_sge);
296		}
297		qp->r_state = OP(SEND_LAST);
   		/* Only a packet that begins a new message can be processed. */
298		switch (opcode) {
299		case OP(SEND_FIRST):
300		case OP(SEND_ONLY):
301		case OP(SEND_ONLY_WITH_IMMEDIATE):
302			goto send_first;
303
304		case OP(RDMA_WRITE_FIRST):
305		case OP(RDMA_WRITE_ONLY):
306		case OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE):
307			goto rdma_first;
308
309		default:
310			goto drop;
311		}
312	}
313
314	/* Check for opcode sequence errors. */
315	switch (qp->r_state) {
316	case OP(SEND_FIRST):
317	case OP(SEND_MIDDLE):
318		if (opcode == OP(SEND_MIDDLE) ||
319		    opcode == OP(SEND_LAST) ||
320		    opcode == OP(SEND_LAST_WITH_IMMEDIATE))
321			break;
322		goto inv;
323
324	case OP(RDMA_WRITE_FIRST):
325	case OP(RDMA_WRITE_MIDDLE):
326		if (opcode == OP(RDMA_WRITE_MIDDLE) ||
327		    opcode == OP(RDMA_WRITE_LAST) ||
328		    opcode == OP(RDMA_WRITE_LAST_WITH_IMMEDIATE))
329			break;
330		goto inv;
331
332	default:
333		if (opcode == OP(SEND_FIRST) ||
334		    opcode == OP(SEND_ONLY) ||
335		    opcode == OP(SEND_ONLY_WITH_IMMEDIATE) ||
336		    opcode == OP(RDMA_WRITE_FIRST) ||
337		    opcode == OP(RDMA_WRITE_ONLY) ||
338		    opcode == OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE))
339			break;
340		goto inv;
341	}
342
343	if (qp->state == IB_QPS_RTR && !(qp->r_flags & RVT_R_COMM_EST))
344		rvt_comm_est(qp);
345
346	/* OK, process the packet. */
347	switch (opcode) {
348	case OP(SEND_FIRST):
349	case OP(SEND_ONLY):
350	case OP(SEND_ONLY_WITH_IMMEDIATE):
351send_first:
   		/* Reuse the RWQE saved by an aborted SEND, else fetch a new one. */
352		if (test_and_clear_bit(RVT_R_REWIND_SGE, &qp->r_aflags)) {
353			qp->r_sge = qp->s_rdma_read_sge;
354		} else {
355			ret = rvt_get_rwqe(qp, false);
356			if (ret < 0)
357				goto op_err;
358			if (!ret)
359				goto drop;
360			/*
361			 * qp->s_rdma_read_sge will be the owner
362			 * of the mr references.
363			 */
364			qp->s_rdma_read_sge = qp->r_sge;
365		}
366		qp->r_rcv_len = 0;
367		if (opcode == OP(SEND_ONLY))
368			goto no_immediate_data;
369		else if (opcode == OP(SEND_ONLY_WITH_IMMEDIATE))
370			goto send_last_imm;
371		fallthrough;
372	case OP(SEND_MIDDLE):
373		/* Check for invalid length PMTU or posted rwqe len. */
374		/*
375		 * There will be no padding for 9B packet but 16B packets
376		 * will come in with some padding since we always add
377		 * CRC and LT bytes which will need to be flit aligned
378		 */
379		if (unlikely(tlen != (hdrsize + pmtu + extra_bytes)))
380			goto rewind;
381		qp->r_rcv_len += pmtu;
382		if (unlikely(qp->r_rcv_len > qp->r_len))
383			goto rewind;
384		rvt_copy_sge(qp, &qp->r_sge, data, pmtu, false, false);
385		break;
386
387	case OP(SEND_LAST_WITH_IMMEDIATE):
388send_last_imm:
389		wc.ex.imm_data = ohdr->u.imm_data;
390		wc.wc_flags = IB_WC_WITH_IMM;
391		goto send_last;
392	case OP(SEND_LAST):
393no_immediate_data:
394		wc.ex.imm_data = 0;
395		wc.wc_flags = 0;
396send_last:
397		/* Check for invalid length. */
398		/* LAST len should be >= 1 */
399		if (unlikely(tlen < (hdrsize + extra_bytes)))
400			goto rewind;
401		/* Don't count the CRC. */
402		tlen -= (hdrsize + extra_bytes);
403		wc.byte_len = tlen + qp->r_rcv_len;
404		if (unlikely(wc.byte_len > qp->r_len))
405			goto rewind;
406		wc.opcode = IB_WC_RECV;
407		rvt_copy_sge(qp, &qp->r_sge, data, tlen, false, false);
408		rvt_put_ss(&qp->s_rdma_read_sge);
   /* Shared completion tail for SEND and RDMA WRITE with immediate. */
409last_imm:
410		wc.wr_id = qp->r_wr_id;
411		wc.status = IB_WC_SUCCESS;
412		wc.qp = &qp->ibqp;
413		wc.src_qp = qp->remote_qpn;
414		wc.slid = rdma_ah_get_dlid(&qp->remote_ah_attr) & U16_MAX;
415		/*
416		 * It seems that IB mandates the presence of an SL in a
417		 * work completion only for the UD transport (see section
418		 * 11.4.2 of IBTA Vol. 1).
419		 *
420		 * However, the way the SL is chosen below is consistent
421		 * with the way that IB/qib works and is trying to avoid
422		 * introducing incompatibilities.
423		 *
424		 * See also OPA Vol. 1, section 9.7.6, and table 9-17.
425		 */
426		wc.sl = rdma_ah_get_sl(&qp->remote_ah_attr);
427		/* zero fields that are N/A */
428		wc.vendor_err = 0;
429		wc.pkey_index = 0;
430		wc.dlid_path_bits = 0;
431		wc.port_num = 0;
432		/* Signal completion event if the solicited bit is set. */
433		rvt_recv_cq(qp, &wc, ib_bth_is_solicited(ohdr));
434		break;
435
436	case OP(RDMA_WRITE_FIRST):
437	case OP(RDMA_WRITE_ONLY):
438	case OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE): /* consume RWQE */
439rdma_first:
440		if (unlikely(!(qp->qp_access_flags &
441			       IB_ACCESS_REMOTE_WRITE))) {
442			goto drop;
443		}
   		/* The RETH supplies the target address, rkey and total length. */
444		reth = &ohdr->u.rc.reth;
445		qp->r_len = be32_to_cpu(reth->length);
446		qp->r_rcv_len = 0;
447		qp->r_sge.sg_list = NULL;
448		if (qp->r_len != 0) {
449			u32 rkey = be32_to_cpu(reth->rkey);
450			u64 vaddr = be64_to_cpu(reth->vaddr);
451			int ok;
452
453			/* Check rkey */
454			ok = rvt_rkey_ok(qp, &qp->r_sge.sge, qp->r_len,
455					 vaddr, rkey, IB_ACCESS_REMOTE_WRITE);
456			if (unlikely(!ok))
457				goto drop;
458			qp->r_sge.num_sge = 1;
459		} else {
   			/* Zero-length write: no memory region is referenced. */
460			qp->r_sge.num_sge = 0;
461			qp->r_sge.sge.mr = NULL;
462			qp->r_sge.sge.vaddr = NULL;
463			qp->r_sge.sge.length = 0;
464			qp->r_sge.sge.sge_length = 0;
465		}
466		if (opcode == OP(RDMA_WRITE_ONLY)) {
467			goto rdma_last;
468		} else if (opcode == OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE)) {
469			wc.ex.imm_data = ohdr->u.rc.imm_data;
470			goto rdma_last_imm;
471		}
472		fallthrough;
473	case OP(RDMA_WRITE_MIDDLE):
474		/* Check for invalid length PMTU or posted rwqe len. */
   		/*
   		 * Same rule as SEND_MIDDLE: exactly one PMTU of payload plus
   		 * extra_bytes, so pad and packet->extra_byte are accounted for.
   		 */
475		if (unlikely(tlen != (hdrsize + pmtu + extra_bytes)))
476			goto drop;
477		qp->r_rcv_len += pmtu;
478		if (unlikely(qp->r_rcv_len > qp->r_len))
479			goto drop;
480		rvt_copy_sge(qp, &qp->r_sge, data, pmtu, true, false);
481		break;
482
483	case OP(RDMA_WRITE_LAST_WITH_IMMEDIATE):
484		wc.ex.imm_data = ohdr->u.imm_data;
485rdma_last_imm:
486		wc.wc_flags = IB_WC_WITH_IMM;
487
488		/* Check for invalid length. */
489		/* LAST len should be >= 1 */
   		/* Guard with exactly what is subtracted below so tlen cannot wrap. */
490		if (unlikely(tlen < (hdrsize + extra_bytes)))
491			goto drop;
492		/* Don't count the CRC. */
493		tlen -= (hdrsize + extra_bytes);
494		if (unlikely(tlen + qp->r_rcv_len != qp->r_len))
495			goto drop;
496		if (test_and_clear_bit(RVT_R_REWIND_SGE, &qp->r_aflags)) {
497			rvt_put_ss(&qp->s_rdma_read_sge);
498		} else {
499			ret = rvt_get_rwqe(qp, true);
500			if (ret < 0)
501				goto op_err;
502			if (!ret)
503				goto drop;
504		}
505		wc.byte_len = qp->r_len;
506		wc.opcode = IB_WC_RECV_RDMA_WITH_IMM;
507		rvt_copy_sge(qp, &qp->r_sge, data, tlen, true, false);
508		rvt_put_ss(&qp->r_sge);
509		goto last_imm;
510
511	case OP(RDMA_WRITE_LAST):
512rdma_last:
513		/* Check for invalid length. */
514		/* LAST len should be >= 1 */
   		/* Guard with exactly what is subtracted below so tlen cannot wrap. */
515		if (unlikely(tlen < (hdrsize + extra_bytes)))
516			goto drop;
517		/* Don't count the CRC. */
518		tlen -= (hdrsize + extra_bytes);
519		if (unlikely(tlen + qp->r_rcv_len != qp->r_len))
520			goto drop;
521		rvt_copy_sge(qp, &qp->r_sge, data, tlen, true, false);
522		rvt_put_ss(&qp->r_sge);
523		break;
524
525	default:
526		/* Drop packet for unknown opcodes. */
527		goto drop;
528	}
   	/* Packet accepted: expect the next PSN and remember this opcode. */
529	qp->r_psn++;
530	qp->r_state = opcode;
531	return;
532
   /* Abort the current SEND but keep its RWQE for the next message. */
533rewind:
534	set_bit(RVT_R_REWIND_SGE, &qp->r_aflags);
535	qp->r_sge.num_sge = 0;
536drop:
537	ibp->rvp.n_pkt_drops++;
538	return;
539
540op_err:
541	rvt_rc_error(qp, IB_WC_LOC_QP_OP_ERR);
542}
v5.4
 
  1/*
  2 * Copyright(c) 2015 - 2018 Intel Corporation.
  3 *
  4 * This file is provided under a dual BSD/GPLv2 license.  When using or
  5 * redistributing this file, you may do so under either license.
  6 *
  7 * GPL LICENSE SUMMARY
  8 *
  9 * This program is free software; you can redistribute it and/or modify
 10 * it under the terms of version 2 of the GNU General Public License as
 11 * published by the Free Software Foundation.
 12 *
 13 * This program is distributed in the hope that it will be useful, but
 14 * WITHOUT ANY WARRANTY; without even the implied warranty of
 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 16 * General Public License for more details.
 17 *
 18 * BSD LICENSE
 19 *
 20 * Redistribution and use in source and binary forms, with or without
 21 * modification, are permitted provided that the following conditions
 22 * are met:
 23 *
 24 *  - Redistributions of source code must retain the above copyright
 25 *    notice, this list of conditions and the following disclaimer.
 26 *  - Redistributions in binary form must reproduce the above copyright
 27 *    notice, this list of conditions and the following disclaimer in
 28 *    the documentation and/or other materials provided with the
 29 *    distribution.
 30 *  - Neither the name of Intel Corporation nor the names of its
 31 *    contributors may be used to endorse or promote products derived
 32 *    from this software without specific prior written permission.
 33 *
 34 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 35 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 36 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 37 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 38 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 39 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 40 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 41 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 42 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 43 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 44 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 45 *
 46 */
 47
 48#include "hfi.h"
 49#include "verbs_txreq.h"
 50#include "qp.h"
 51
 52/*
    * Cut down ridiculously long IB macro names: OP(x) is shorthand for
    * UC_OP(x) everywhere below.
    */
 53#define OP(x) UC_OP(x)
 54
 55/**
 56 * hfi1_make_uc_req - construct a request packet (SEND, RDMA write)
 57 * @qp: a pointer to the QP
    * @ps: the current packet state
 58 *
    * Obtains a txreq with get_txreq() and, driven by qp->s_state, either
    * starts the send WQE at qp->s_cur or continues a multi-packet message.
    * At most one packet, carrying no more than qp->pmtu payload bytes, is
    * prepared per call.
    *
 59 * Assume s_lock is held.
 60 *
 61 * Return 1 if constructed; otherwise, return 0.
    * 1 is also returned, with ps->s_txreq set to NULL, when a WQE was
    * completed without building a packet (a flush while the QP cannot
    * send, or a local REG_MR/LOCAL_INV operation).  On a 0 return
    * ps->s_txreq is NULL and RVT_S_BUSY has been cleared in qp->s_flags.
 62 */
 63int hfi1_make_uc_req(struct rvt_qp *qp, struct hfi1_pkt_state *ps)
 64{
 65	struct hfi1_qp_priv *priv = qp->priv;
 66	struct ib_other_headers *ohdr;
 67	struct rvt_swqe *wqe;
 68	u32 hwords;
 69	u32 bth0 = 0;
 70	u32 len;
 71	u32 pmtu = qp->pmtu;
 72	int middle = 0;
 73
 74	ps->s_txreq = get_txreq(ps->dev, qp);
 75	if (!ps->s_txreq)
 76		goto bail_no_tx;
 77
 78	if (!(ib_rvt_state_ops[qp->state] & RVT_PROCESS_SEND_OK)) {
 79		if (!(ib_rvt_state_ops[qp->state] & RVT_FLUSH_SEND))
 80			goto bail;
 81		/* We are in the error state, flush the work request. */
 82		if (qp->s_last == READ_ONCE(qp->s_head))
 83			goto bail;
 84		/* If DMAs are in progress, we can't flush immediately. */
 85		if (iowait_sdma_pending(&priv->s_iowait)) {
 86			qp->s_flags |= RVT_S_WAIT_DMA;
 87			goto bail;
 88		}
 89		clear_ahg(qp);
   		/* Flush one WQE per call, oldest (s_last) first. */
 90		wqe = rvt_get_swqe_ptr(qp, qp->s_last);
 91		rvt_send_complete(qp, wqe, IB_WC_WR_FLUSH_ERR);
 92		goto done_free_tx;
 93	}
 94
   	/*
   	 * Select where the "other headers" live inside the txreq for the
   	 * 9B or 16B header layout, and start hwords at the LRH+BTH size.
   	 */
 95	if (priv->hdr_type == HFI1_PKT_TYPE_9B) {
 96		/* header size in 32-bit words LRH+BTH = (8+12)/4. */
 97		hwords = 5;
 98		if (rdma_ah_get_ah_flags(&qp->remote_ah_attr) & IB_AH_GRH)
 99			ohdr = &ps->s_txreq->phdr.hdr.ibh.u.l.oth;
100		else
101			ohdr = &ps->s_txreq->phdr.hdr.ibh.u.oth;
102	} else {
103		/* header size in 32-bit words 16B LRH+BTH = (16+12)/4. */
104		hwords = 7;
105		if ((rdma_ah_get_ah_flags(&qp->remote_ah_attr) & IB_AH_GRH) &&
106		    (hfi1_check_mcast(rdma_ah_get_dlid(&qp->remote_ah_attr))))
107			ohdr = &ps->s_txreq->phdr.hdr.opah.u.l.oth;
108		else
109			ohdr = &ps->s_txreq->phdr.hdr.opah.u.oth;
110	}
111
112	/* Get the next send request. */
113	wqe = rvt_get_swqe_ptr(qp, qp->s_cur);
114	qp->s_wqe = NULL;
115	switch (qp->s_state) {
   	/* Any state other than FIRST/MIDDLE: begin the WQE at s_cur. */
116	default:
117		if (!(ib_rvt_state_ops[qp->state] &
118		    RVT_PROCESS_NEXT_SEND_OK))
119			goto bail;
120		/* Check if send work queue is empty. */
121		if (qp->s_cur == READ_ONCE(qp->s_head)) {
122			clear_ahg(qp);
123			goto bail;
124		}
125		/*
126		 * Local operations are processed immediately
127		 * after all prior requests have completed.
128		 */
129		if (wqe->wr.opcode == IB_WR_REG_MR ||
130		    wqe->wr.opcode == IB_WR_LOCAL_INV) {
131			int local_ops = 0;
132			int err = 0;
133
   			/* Prior requests are still outstanding; retry later. */
134			if (qp->s_last != qp->s_cur)
135				goto bail;
136			if (++qp->s_cur == qp->s_size)
137				qp->s_cur = 0;
138			if (!(wqe->wr.send_flags & RVT_SEND_COMPLETION_ONLY)) {
139				err = rvt_invalidate_rkey(
140					qp, wqe->wr.ex.invalidate_rkey);
141				local_ops = 1;
142			}
143			rvt_send_complete(qp, wqe, err ? IB_WC_LOC_PROT_ERR
144							: IB_WC_SUCCESS);
145			if (local_ops)
146				atomic_dec(&qp->local_ops_pending);
147			goto done_free_tx;
148		}
149		/*
150		 * Start a new request.
151		 */
152		qp->s_psn = wqe->psn;
153		qp->s_sge.sge = wqe->sg_list[0];
154		qp->s_sge.sg_list = wqe->sg_list + 1;
155		qp->s_sge.num_sge = wqe->wr.num_sge;
156		qp->s_sge.total_len = wqe->length;
157		len = wqe->length;
158		qp->s_len = len;
159		switch (wqe->wr.opcode) {
160		case IB_WR_SEND:
161		case IB_WR_SEND_WITH_IMM:
   			/*
   			 * Larger than one PMTU: send the FIRST packet now and
   			 * leave s_cur on this WQE until its LAST packet.
   			 */
162			if (len > pmtu) {
163				qp->s_state = OP(SEND_FIRST);
164				len = pmtu;
165				break;
166			}
167			if (wqe->wr.opcode == IB_WR_SEND) {
168				qp->s_state = OP(SEND_ONLY);
169			} else {
170				qp->s_state =
171					OP(SEND_ONLY_WITH_IMMEDIATE);
172				/* Immediate data comes after the BTH */
173				ohdr->u.imm_data = wqe->wr.ex.imm_data;
174				hwords += 1;
175			}
176			if (wqe->wr.send_flags & IB_SEND_SOLICITED)
177				bth0 |= IB_BTH_SOLICITED;
178			qp->s_wqe = wqe;
179			if (++qp->s_cur >= qp->s_size)
180				qp->s_cur = 0;
181			break;
182
183		case IB_WR_RDMA_WRITE:
184		case IB_WR_RDMA_WRITE_WITH_IMM:
   			/* The RETH carries the full message length, not this packet's. */
185			ohdr->u.rc.reth.vaddr =
186				cpu_to_be64(wqe->rdma_wr.remote_addr);
187			ohdr->u.rc.reth.rkey =
188				cpu_to_be32(wqe->rdma_wr.rkey);
189			ohdr->u.rc.reth.length = cpu_to_be32(len);
190			hwords += sizeof(struct ib_reth) / 4;
191			if (len > pmtu) {
192				qp->s_state = OP(RDMA_WRITE_FIRST);
193				len = pmtu;
194				break;
195			}
196			if (wqe->wr.opcode == IB_WR_RDMA_WRITE) {
197				qp->s_state = OP(RDMA_WRITE_ONLY);
198			} else {
199				qp->s_state =
200					OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE);
201				/* Immediate data comes after the RETH */
202				ohdr->u.rc.imm_data = wqe->wr.ex.imm_data;
203				hwords += 1;
   				/* Solicited bit is only set when immediate data is sent. */
204				if (wqe->wr.send_flags & IB_SEND_SOLICITED)
205					bth0 |= IB_BTH_SOLICITED;
206			}
207			qp->s_wqe = wqe;
208			if (++qp->s_cur >= qp->s_size)
209				qp->s_cur = 0;
210			break;
211
212		default:
213			goto bail;
214		}
215		break;
216
217	case OP(SEND_FIRST):
218		qp->s_state = OP(SEND_MIDDLE);
219		/* FALLTHROUGH */
220	case OP(SEND_MIDDLE):
   		/* s_len is the number of bytes of this message still unsent. */
221		len = qp->s_len;
222		if (len > pmtu) {
223			len = pmtu;
   			/*
   			 * middle is handed to hfi1_make_ruc_header() below.
   			 * NOTE(review): presumably lets AHG reuse the header
   			 * for middle packets; confirm against that helper.
   			 */
224			middle = HFI1_CAP_IS_KSET(SDMA_AHG);
225			break;
226		}
227		if (wqe->wr.opcode == IB_WR_SEND) {
228			qp->s_state = OP(SEND_LAST);
229		} else {
230			qp->s_state = OP(SEND_LAST_WITH_IMMEDIATE);
231			/* Immediate data comes after the BTH */
232			ohdr->u.imm_data = wqe->wr.ex.imm_data;
233			hwords += 1;
234		}
235		if (wqe->wr.send_flags & IB_SEND_SOLICITED)
236			bth0 |= IB_BTH_SOLICITED;
237		qp->s_wqe = wqe;
238		if (++qp->s_cur >= qp->s_size)
239			qp->s_cur = 0;
240		break;
241
242	case OP(RDMA_WRITE_FIRST):
243		qp->s_state = OP(RDMA_WRITE_MIDDLE);
244		/* FALLTHROUGH */
245	case OP(RDMA_WRITE_MIDDLE):
246		len = qp->s_len;
247		if (len > pmtu) {
248			len = pmtu;
249			middle = HFI1_CAP_IS_KSET(SDMA_AHG);
250			break;
251		}
252		if (wqe->wr.opcode == IB_WR_RDMA_WRITE) {
253			qp->s_state = OP(RDMA_WRITE_LAST);
254		} else {
255			qp->s_state =
256				OP(RDMA_WRITE_LAST_WITH_IMMEDIATE);
257			/* Immediate data comes after the BTH */
258			ohdr->u.imm_data = wqe->wr.ex.imm_data;
259			hwords += 1;
260			if (wqe->wr.send_flags & IB_SEND_SOLICITED)
261				bth0 |= IB_BTH_SOLICITED;
262		}
263		qp->s_wqe = wqe;
264		if (++qp->s_cur >= qp->s_size)
265			qp->s_cur = 0;
266		break;
267	}
   	/*
   	 * Common tail for every path that produced a packet: account for the
   	 * payload bytes, describe the packet in the txreq and build the
   	 * header.  The new s_state is placed in bits 31:24 of the bth0
   	 * argument, and s_psn is post-incremented for the next packet.
   	 */
268	qp->s_len -= len;
269	ps->s_txreq->hdr_dwords = hwords;
270	ps->s_txreq->sde = priv->s_sde;
271	ps->s_txreq->ss = &qp->s_sge;
272	ps->s_txreq->s_cur_size = len;
273	hfi1_make_ruc_header(qp, ohdr, bth0 | (qp->s_state << 24),
274			     qp->remote_qpn, mask_psn(qp->s_psn++),
275			     middle, ps);
276	return 1;
277
   /* A WQE was completed without a packet: drop the txreq, still report 1. */
278done_free_tx:
279	hfi1_put_txreq(ps->s_txreq);
280	ps->s_txreq = NULL;
281	return 1;
282
   /* Nothing to send: release the txreq (if one was obtained) and clear BUSY. */
283bail:
284	hfi1_put_txreq(ps->s_txreq);
285
286bail_no_tx:
287	ps->s_txreq = NULL;
288	qp->s_flags &= ~RVT_S_BUSY;
289	return 0;
290}
291
292/**
293 * hfi1_uc_rcv - handle an incoming UC packet
294 * @packet: the packet structure
300 *
301 * This is called from qp_rcv() to process an incoming UC packet
302 * for the given QP.
303 * Called at interrupt level.
    *
    * The packet is silently ignored when hfi1_ruc_check_hdr() rejects it.
    * A PSN mismatch resynchronises qp->r_psn to the packet's PSN and
    * abandons any message in progress; processing then continues only if
    * the packet starts a new message (a FIRST or ONLY opcode).  Packets
    * that fail an opcode-sequence, length, access or rkey check are
    * dropped and counted in ibp->rvp.n_pkt_drops.  A negative return from
    * rvt_get_rwqe() puts the QP in error through
    * rvt_rc_error(qp, IB_WC_LOC_QP_OP_ERR).
    *
    * All length checks use extra_bytes (pad + packet->extra_byte + CRC),
    * the same quantity later subtracted from tlen, so the unsigned
    * payload length cannot wrap.
304 */
305void hfi1_uc_rcv(struct hfi1_packet *packet)
306{
307	struct hfi1_ibport *ibp = rcd_to_iport(packet->rcd);
308	void *data = packet->payload;
309	u32 tlen = packet->tlen;
310	struct rvt_qp *qp = packet->qp;
311	struct ib_other_headers *ohdr = packet->ohdr;
312	u32 opcode = packet->opcode;
313	u32 hdrsize = packet->hlen;
314	u32 psn;
315	u32 pad = packet->pad;
316	struct ib_wc wc;
317	u32 pmtu = qp->pmtu;
318	struct ib_reth *reth;
319	int ret;
   	/* Non-payload bytes that follow the headers: pad, extra byte, CRC. */
320	u8 extra_bytes = pad + packet->extra_byte + (SIZE_OF_CRC << 2);
321
322	if (hfi1_ruc_check_hdr(ibp, packet))
323		return;
324
325	process_ecn(qp, packet);
326
327	psn = ib_bth_get_psn(ohdr);
328	/* Compare the PSN versus the expected PSN. */
329	if (unlikely(cmp_psn(psn, qp->r_psn) != 0)) {
330		/*
331		 * Handle a sequence error.
332		 * Silently drop any current message.
333		 */
334		qp->r_psn = psn;
335inv:
   		/*
   		 * An interrupted SEND keeps its RWQE for reuse (REWIND_SGE);
   		 * anything else just releases the r_sge references.
   		 */
336		if (qp->r_state == OP(SEND_FIRST) ||
337		    qp->r_state == OP(SEND_MIDDLE)) {
338			set_bit(RVT_R_REWIND_SGE, &qp->r_aflags);
339			qp->r_sge.num_sge = 0;
340		} else {
341			rvt_put_ss(&qp->r_sge);
342		}
343		qp->r_state = OP(SEND_LAST);
   		/* Only a packet that begins a new message can be processed. */
344		switch (opcode) {
345		case OP(SEND_FIRST):
346		case OP(SEND_ONLY):
347		case OP(SEND_ONLY_WITH_IMMEDIATE):
348			goto send_first;
349
350		case OP(RDMA_WRITE_FIRST):
351		case OP(RDMA_WRITE_ONLY):
352		case OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE):
353			goto rdma_first;
354
355		default:
356			goto drop;
357		}
358	}
359
360	/* Check for opcode sequence errors. */
361	switch (qp->r_state) {
362	case OP(SEND_FIRST):
363	case OP(SEND_MIDDLE):
364		if (opcode == OP(SEND_MIDDLE) ||
365		    opcode == OP(SEND_LAST) ||
366		    opcode == OP(SEND_LAST_WITH_IMMEDIATE))
367			break;
368		goto inv;
369
370	case OP(RDMA_WRITE_FIRST):
371	case OP(RDMA_WRITE_MIDDLE):
372		if (opcode == OP(RDMA_WRITE_MIDDLE) ||
373		    opcode == OP(RDMA_WRITE_LAST) ||
374		    opcode == OP(RDMA_WRITE_LAST_WITH_IMMEDIATE))
375			break;
376		goto inv;
377
378	default:
379		if (opcode == OP(SEND_FIRST) ||
380		    opcode == OP(SEND_ONLY) ||
381		    opcode == OP(SEND_ONLY_WITH_IMMEDIATE) ||
382		    opcode == OP(RDMA_WRITE_FIRST) ||
383		    opcode == OP(RDMA_WRITE_ONLY) ||
384		    opcode == OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE))
385			break;
386		goto inv;
387	}
388
389	if (qp->state == IB_QPS_RTR && !(qp->r_flags & RVT_R_COMM_EST))
390		rvt_comm_est(qp);
391
392	/* OK, process the packet. */
393	switch (opcode) {
394	case OP(SEND_FIRST):
395	case OP(SEND_ONLY):
396	case OP(SEND_ONLY_WITH_IMMEDIATE):
397send_first:
   		/* Reuse the RWQE saved by an aborted SEND, else fetch a new one. */
398		if (test_and_clear_bit(RVT_R_REWIND_SGE, &qp->r_aflags)) {
399			qp->r_sge = qp->s_rdma_read_sge;
400		} else {
401			ret = rvt_get_rwqe(qp, false);
402			if (ret < 0)
403				goto op_err;
404			if (!ret)
405				goto drop;
406			/*
407			 * qp->s_rdma_read_sge will be the owner
408			 * of the mr references.
409			 */
410			qp->s_rdma_read_sge = qp->r_sge;
411		}
412		qp->r_rcv_len = 0;
413		if (opcode == OP(SEND_ONLY))
414			goto no_immediate_data;
415		else if (opcode == OP(SEND_ONLY_WITH_IMMEDIATE))
416			goto send_last_imm;
417		/* FALLTHROUGH */
418	case OP(SEND_MIDDLE):
419		/* Check for invalid length PMTU or posted rwqe len. */
420		/*
421		 * There will be no padding for 9B packet but 16B packets
422		 * will come in with some padding since we always add
423		 * CRC and LT bytes which will need to be flit aligned
424		 */
425		if (unlikely(tlen != (hdrsize + pmtu + extra_bytes)))
426			goto rewind;
427		qp->r_rcv_len += pmtu;
428		if (unlikely(qp->r_rcv_len > qp->r_len))
429			goto rewind;
430		rvt_copy_sge(qp, &qp->r_sge, data, pmtu, false, false);
431		break;
432
433	case OP(SEND_LAST_WITH_IMMEDIATE):
434send_last_imm:
435		wc.ex.imm_data = ohdr->u.imm_data;
436		wc.wc_flags = IB_WC_WITH_IMM;
437		goto send_last;
438	case OP(SEND_LAST):
439no_immediate_data:
440		wc.ex.imm_data = 0;
441		wc.wc_flags = 0;
442send_last:
443		/* Check for invalid length. */
444		/* LAST len should be >= 1 */
445		if (unlikely(tlen < (hdrsize + extra_bytes)))
446			goto rewind;
447		/* Don't count the CRC. */
448		tlen -= (hdrsize + extra_bytes);
449		wc.byte_len = tlen + qp->r_rcv_len;
450		if (unlikely(wc.byte_len > qp->r_len))
451			goto rewind;
452		wc.opcode = IB_WC_RECV;
453		rvt_copy_sge(qp, &qp->r_sge, data, tlen, false, false);
454		rvt_put_ss(&qp->s_rdma_read_sge);
   /* Shared completion tail for SEND and RDMA WRITE with immediate. */
455last_imm:
456		wc.wr_id = qp->r_wr_id;
457		wc.status = IB_WC_SUCCESS;
458		wc.qp = &qp->ibqp;
459		wc.src_qp = qp->remote_qpn;
460		wc.slid = rdma_ah_get_dlid(&qp->remote_ah_attr) & U16_MAX;
461		/*
462		 * It seems that IB mandates the presence of an SL in a
463		 * work completion only for the UD transport (see section
464		 * 11.4.2 of IBTA Vol. 1).
465		 *
466		 * However, the way the SL is chosen below is consistent
467		 * with the way that IB/qib works and is trying to avoid
468		 * introducing incompatibilities.
469		 *
470		 * See also OPA Vol. 1, section 9.7.6, and table 9-17.
471		 */
472		wc.sl = rdma_ah_get_sl(&qp->remote_ah_attr);
473		/* zero fields that are N/A */
474		wc.vendor_err = 0;
475		wc.pkey_index = 0;
476		wc.dlid_path_bits = 0;
477		wc.port_num = 0;
478		/* Signal completion event if the solicited bit is set. */
479		rvt_recv_cq(qp, &wc, ib_bth_is_solicited(ohdr));
480		break;
481
482	case OP(RDMA_WRITE_FIRST):
483	case OP(RDMA_WRITE_ONLY):
484	case OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE): /* consume RWQE */
485rdma_first:
486		if (unlikely(!(qp->qp_access_flags &
487			       IB_ACCESS_REMOTE_WRITE))) {
488			goto drop;
489		}
   		/* The RETH supplies the target address, rkey and total length. */
490		reth = &ohdr->u.rc.reth;
491		qp->r_len = be32_to_cpu(reth->length);
492		qp->r_rcv_len = 0;
493		qp->r_sge.sg_list = NULL;
494		if (qp->r_len != 0) {
495			u32 rkey = be32_to_cpu(reth->rkey);
496			u64 vaddr = be64_to_cpu(reth->vaddr);
497			int ok;
498
499			/* Check rkey */
500			ok = rvt_rkey_ok(qp, &qp->r_sge.sge, qp->r_len,
501					 vaddr, rkey, IB_ACCESS_REMOTE_WRITE);
502			if (unlikely(!ok))
503				goto drop;
504			qp->r_sge.num_sge = 1;
505		} else {
   			/* Zero-length write: no memory region is referenced. */
506			qp->r_sge.num_sge = 0;
507			qp->r_sge.sge.mr = NULL;
508			qp->r_sge.sge.vaddr = NULL;
509			qp->r_sge.sge.length = 0;
510			qp->r_sge.sge.sge_length = 0;
511		}
512		if (opcode == OP(RDMA_WRITE_ONLY)) {
513			goto rdma_last;
514		} else if (opcode == OP(RDMA_WRITE_ONLY_WITH_IMMEDIATE)) {
515			wc.ex.imm_data = ohdr->u.rc.imm_data;
516			goto rdma_last_imm;
517		}
518		/* FALLTHROUGH */
519	case OP(RDMA_WRITE_MIDDLE):
520		/* Check for invalid length PMTU or posted rwqe len. */
   		/*
   		 * Same rule as SEND_MIDDLE: exactly one PMTU of payload plus
   		 * extra_bytes, so pad and packet->extra_byte are accounted for.
   		 */
521		if (unlikely(tlen != (hdrsize + pmtu + extra_bytes)))
522			goto drop;
523		qp->r_rcv_len += pmtu;
524		if (unlikely(qp->r_rcv_len > qp->r_len))
525			goto drop;
526		rvt_copy_sge(qp, &qp->r_sge, data, pmtu, true, false);
527		break;
528
529	case OP(RDMA_WRITE_LAST_WITH_IMMEDIATE):
530		wc.ex.imm_data = ohdr->u.imm_data;
531rdma_last_imm:
532		wc.wc_flags = IB_WC_WITH_IMM;
533
534		/* Check for invalid length. */
535		/* LAST len should be >= 1 */
   		/* Guard with exactly what is subtracted below so tlen cannot wrap. */
536		if (unlikely(tlen < (hdrsize + extra_bytes)))
537			goto drop;
538		/* Don't count the CRC. */
539		tlen -= (hdrsize + extra_bytes);
540		if (unlikely(tlen + qp->r_rcv_len != qp->r_len))
541			goto drop;
542		if (test_and_clear_bit(RVT_R_REWIND_SGE, &qp->r_aflags)) {
543			rvt_put_ss(&qp->s_rdma_read_sge);
544		} else {
545			ret = rvt_get_rwqe(qp, true);
546			if (ret < 0)
547				goto op_err;
548			if (!ret)
549				goto drop;
550		}
551		wc.byte_len = qp->r_len;
552		wc.opcode = IB_WC_RECV_RDMA_WITH_IMM;
553		rvt_copy_sge(qp, &qp->r_sge, data, tlen, true, false);
554		rvt_put_ss(&qp->r_sge);
555		goto last_imm;
556
557	case OP(RDMA_WRITE_LAST):
558rdma_last:
559		/* Check for invalid length. */
560		/* LAST len should be >= 1 */
   		/* Guard with exactly what is subtracted below so tlen cannot wrap. */
561		if (unlikely(tlen < (hdrsize + extra_bytes)))
562			goto drop;
563		/* Don't count the CRC. */
564		tlen -= (hdrsize + extra_bytes);
565		if (unlikely(tlen + qp->r_rcv_len != qp->r_len))
566			goto drop;
567		rvt_copy_sge(qp, &qp->r_sge, data, tlen, true, false);
568		rvt_put_ss(&qp->r_sge);
569		break;
570
571	default:
572		/* Drop packet for unknown opcodes. */
573		goto drop;
574	}
   	/* Packet accepted: expect the next PSN and remember this opcode. */
575	qp->r_psn++;
576	qp->r_state = opcode;
577	return;
578
   /* Abort the current SEND but keep its RWQE for the next message. */
579rewind:
580	set_bit(RVT_R_REWIND_SGE, &qp->r_aflags);
581	qp->r_sge.num_sge = 0;
582drop:
583	ibp->rvp.n_pkt_drops++;
584	return;
585
586op_err:
587	rvt_rc_error(qp, IB_WC_LOC_QP_OP_ERR);
588}