Linux Audio

Check our new training course

Loading...
v6.8
  1/* SPDX-License-Identifier: GPL-2.0 OR BSD-3-Clause */
 
  2/*
  3 * Copyright(c) 2023 - Cornelis Networks, Inc.
  4 * Copyright(c) 2015 - 2018 Intel Corporation.
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
  5 */
  6#ifndef _HFI1_USER_SDMA_H
  7#define _HFI1_USER_SDMA_H
  8
  9#include <linux/device.h>
 10#include <linux/wait.h>
 11
 12#include "common.h"
 13#include "iowait.h"
 14#include "user_exp_rcv.h"
 15#include "mmu_rb.h"
 16#include "pinning.h"
 17#include "sdma.h"
 18
 19/* The maximum number of Data io vectors per message/request */
 20#define MAX_VECTORS_PER_REQ 8
 21/*
 22 * Maximum number of packet to send from each message/request
 23 * before moving to the next one.
 24 */
 25#define MAX_PKTS_PER_QUEUE 16
 26
 27#define num_pages(x) (1 + ((((x) - 1) & PAGE_MASK) >> PAGE_SHIFT))
 28
 29#define req_opcode(x) \
 30	(((x) >> HFI1_SDMA_REQ_OPCODE_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK)
 31#define req_version(x) \
 32	(((x) >> HFI1_SDMA_REQ_VERSION_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK)
 33#define req_iovcnt(x) \
 34	(((x) >> HFI1_SDMA_REQ_IOVCNT_SHIFT) & HFI1_SDMA_REQ_IOVCNT_MASK)
 35
 36/* Number of BTH.PSN bits used for sequence number in expected rcvs */
 37#define BTH_SEQ_MASK 0x7ffull
 38
 39#define AHG_KDETH_INTR_SHIFT 12
 40#define AHG_KDETH_SH_SHIFT   13
 41#define AHG_KDETH_ARRAY_SIZE  9
 42
 43#define PBC2LRH(x) ((((x) & 0xfff) << 2) - 4)
 44#define LRH2PBC(x) ((((x) >> 2) + 1) & 0xfff)
 45
 46/**
 47 * Build an SDMA AHG header update descriptor and save it to an array.
 48 * @arr        - Array to save the descriptor to.
 49 * @idx        - Index of the array at which the descriptor will be saved.
 50 * @array_size - Size of the array arr.
 51 * @dw         - Update index into the header in DWs.
 52 * @bit        - Start bit.
 53 * @width      - Field width.
 54 * @value      - 16 bits of immediate data to write into the field.
 55 * Returns -ERANGE if idx is invalid. If successful, returns the next index
 56 * (idx + 1) of the array to be used for the next descriptor.
 57 */
 58static inline int ahg_header_set(u32 *arr, int idx, size_t array_size,
 59				 u8 dw, u8 bit, u8 width, u16 value)
 60{
 61	if ((size_t)idx >= array_size)
 62		return -ERANGE;
 63	arr[idx++] = sdma_build_ahg_descriptor(value, dw, bit, width);
 64	return idx;
 65}
 66
 67/* Tx request flag bits */
 68#define TXREQ_FLAGS_REQ_ACK   BIT(0)      /* Set the ACK bit in the header */
 69#define TXREQ_FLAGS_REQ_DISABLE_SH BIT(1) /* Disable header suppression */
 70
 71enum pkt_q_sdma_state {
 72	SDMA_PKT_Q_ACTIVE,
 73	SDMA_PKT_Q_DEFERRED,
 74};
 75
 76#define SDMA_IOWAIT_TIMEOUT 1000 /* in milliseconds */
 77
 78#define SDMA_DBG(req, fmt, ...)				     \
 79	hfi1_cdbg(SDMA, "[%u:%u:%u:%u] " fmt, (req)->pq->dd->unit, \
 80		 (req)->pq->ctxt, (req)->pq->subctxt, (req)->info.comp_idx, \
 81		 ##__VA_ARGS__)
 82
 83struct hfi1_user_sdma_pkt_q {
 84	u16 ctxt;
 85	u16 subctxt;
 86	u16 n_max_reqs;
 87	atomic_t n_reqs;
 88	u16 reqidx;
 89	struct hfi1_devdata *dd;
 90	struct kmem_cache *txreq_cache;
 91	struct user_sdma_request *reqs;
 92	unsigned long *req_in_use;
 93	struct iowait busy;
 94	enum pkt_q_sdma_state state;
 95	wait_queue_head_t wait;
 96	unsigned long unpinned;
 97	struct mmu_rb_handler *handler;
 98	atomic_t n_locked;
 
 99};
100
101struct hfi1_user_sdma_comp_q {
102	u16 nentries;
103	struct hfi1_sdma_comp_entry *comps;
104};
105
 
 
 
 
 
 
 
 
106struct user_sdma_iovec {
107	struct list_head list;
108	struct iovec iov;
 
 
 
 
109	/*
110	 * offset into the virtual address space of the vector at
111	 * which we last left off.
112	 */
113	u64 offset;
 
114};
115
116/* evict operation argument */
117struct evict_data {
118	u32 cleared;	/* count evicted so far */
119	u32 target;	/* target count to evict */
120};
121
122struct user_sdma_request {
123	/* This is the original header from user space */
124	struct hfi1_pkt_header hdr;
125
126	/* Read mostly fields */
127	struct hfi1_user_sdma_pkt_q *pq ____cacheline_aligned_in_smp;
128	struct hfi1_user_sdma_comp_q *cq;
129	/*
130	 * Pointer to the SDMA engine for this request.
131	 * Since different request could be on different VLs,
132	 * each request will need it's own engine pointer.
133	 */
134	struct sdma_engine *sde;
135	struct sdma_req_info info;
136	/* TID array values copied from the tid_iov vector */
137	u32 *tids;
138	/* total length of the data in the request */
139	u32 data_len;
140	/* number of elements copied to the tids array */
141	u16 n_tids;
142	/*
143	 * We copy the iovs for this request (based on
144	 * info.iovcnt). These are only the data vectors
145	 */
146	u8 data_iovs;
147	s8 ahg_idx;
148
149	/* Writeable fields shared with interrupt */
150	u16 seqcomp ____cacheline_aligned_in_smp;
151	u16 seqsubmitted;
152
153	/* Send side fields */
154	struct list_head txps ____cacheline_aligned_in_smp;
155	u16 seqnum;
156	/*
157	 * KDETH.OFFSET (TID) field
158	 * The offset can cover multiple packets, depending on the
159	 * size of the TID entry.
160	 */
161	u32 tidoffset;
162	/*
163	 * KDETH.Offset (Eager) field
164	 * We need to remember the initial value so the headers
165	 * can be updated properly.
166	 */
167	u32 koffset;
168	u32 sent;
169	/* TID index copied from the tid_iov vector */
170	u16 tididx;
171	/* progress index moving along the iovs array */
172	u8 iov_idx;
173	u8 has_error;
174
175	struct user_sdma_iovec iovs[MAX_VECTORS_PER_REQ];
176} ____cacheline_aligned_in_smp;
177
178/*
179 * A single txreq could span up to 3 physical pages when the MTU
180 * is sufficiently large (> 4K). Each of the IOV pointers also
181 * needs it's own set of flags so the vector has been handled
182 * independently of each other.
183 */
184struct user_sdma_txreq {
185	/* Packet header for the txreq */
186	struct hfi1_pkt_header hdr;
187	struct sdma_txreq txreq;
188	struct list_head list;
189	struct user_sdma_request *req;
190	u16 flags;
191	u16 seqnum;
192};
193
194int hfi1_user_sdma_alloc_queues(struct hfi1_ctxtdata *uctxt,
195				struct hfi1_filedata *fd);
196int hfi1_user_sdma_free_queues(struct hfi1_filedata *fd,
197			       struct hfi1_ctxtdata *uctxt);
198int hfi1_user_sdma_process_request(struct hfi1_filedata *fd,
199				   struct iovec *iovec, unsigned long dim,
200				   unsigned long *count);
 
201#endif /* _HFI1_USER_SDMA_H */
v5.4
  1#ifndef _HFI1_USER_SDMA_H
  2#define _HFI1_USER_SDMA_H
  3/*
 
  4 * Copyright(c) 2015 - 2018 Intel Corporation.
  5 *
  6 * This file is provided under a dual BSD/GPLv2 license.  When using or
  7 * redistributing this file, you may do so under either license.
  8 *
  9 * GPL LICENSE SUMMARY
 10 *
 11 * This program is free software; you can redistribute it and/or modify
 12 * it under the terms of version 2 of the GNU General Public License as
 13 * published by the Free Software Foundation.
 14 *
 15 * This program is distributed in the hope that it will be useful, but
 16 * WITHOUT ANY WARRANTY; without even the implied warranty of
 17 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 18 * General Public License for more details.
 19 *
 20 * BSD LICENSE
 21 *
 22 * Redistribution and use in source and binary forms, with or without
 23 * modification, are permitted provided that the following conditions
 24 * are met:
 25 *
 26 *  - Redistributions of source code must retain the above copyright
 27 *    notice, this list of conditions and the following disclaimer.
 28 *  - Redistributions in binary form must reproduce the above copyright
 29 *    notice, this list of conditions and the following disclaimer in
 30 *    the documentation and/or other materials provided with the
 31 *    distribution.
 32 *  - Neither the name of Intel Corporation nor the names of its
 33 *    contributors may be used to endorse or promote products derived
 34 *    from this software without specific prior written permission.
 35 *
 36 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 37 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 38 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 39 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 40 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 41 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 42 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 43 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 44 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 45 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 46 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 47 *
 48 */
 
 
 
 49#include <linux/device.h>
 50#include <linux/wait.h>
 51
 52#include "common.h"
 53#include "iowait.h"
 54#include "user_exp_rcv.h"
 
 
 
 55
 56/* The maximum number of Data io vectors per message/request */
 57#define MAX_VECTORS_PER_REQ 8
 58/*
 59 * Maximum number of packet to send from each message/request
 60 * before moving to the next one.
 61 */
 62#define MAX_PKTS_PER_QUEUE 16
 63
 64#define num_pages(x) (1 + ((((x) - 1) & PAGE_MASK) >> PAGE_SHIFT))
 65
 66#define req_opcode(x) \
 67	(((x) >> HFI1_SDMA_REQ_OPCODE_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK)
 68#define req_version(x) \
 69	(((x) >> HFI1_SDMA_REQ_VERSION_SHIFT) & HFI1_SDMA_REQ_OPCODE_MASK)
 70#define req_iovcnt(x) \
 71	(((x) >> HFI1_SDMA_REQ_IOVCNT_SHIFT) & HFI1_SDMA_REQ_IOVCNT_MASK)
 72
 73/* Number of BTH.PSN bits used for sequence number in expected rcvs */
 74#define BTH_SEQ_MASK 0x7ffull
 75
 76#define AHG_KDETH_INTR_SHIFT 12
 77#define AHG_KDETH_SH_SHIFT   13
 78#define AHG_KDETH_ARRAY_SIZE  9
 79
 80#define PBC2LRH(x) ((((x) & 0xfff) << 2) - 4)
 81#define LRH2PBC(x) ((((x) >> 2) + 1) & 0xfff)
 82
 83/**
 84 * Build an SDMA AHG header update descriptor and save it to an array.
 85 * @arr        - Array to save the descriptor to.
 86 * @idx        - Index of the array at which the descriptor will be saved.
 87 * @array_size - Size of the array arr.
 88 * @dw         - Update index into the header in DWs.
 89 * @bit        - Start bit.
 90 * @width      - Field width.
 91 * @value      - 16 bits of immediate data to write into the field.
 92 * Returns -ERANGE if idx is invalid. If successful, returns the next index
 93 * (idx + 1) of the array to be used for the next descriptor.
 94 */
 95static inline int ahg_header_set(u32 *arr, int idx, size_t array_size,
 96				 u8 dw, u8 bit, u8 width, u16 value)
 97{
 98	if ((size_t)idx >= array_size)
 99		return -ERANGE;
100	arr[idx++] = sdma_build_ahg_descriptor(value, dw, bit, width);
101	return idx;
102}
103
104/* Tx request flag bits */
105#define TXREQ_FLAGS_REQ_ACK   BIT(0)      /* Set the ACK bit in the header */
106#define TXREQ_FLAGS_REQ_DISABLE_SH BIT(1) /* Disable header suppression */
107
108enum pkt_q_sdma_state {
109	SDMA_PKT_Q_ACTIVE,
110	SDMA_PKT_Q_DEFERRED,
111};
112
113#define SDMA_IOWAIT_TIMEOUT 1000 /* in milliseconds */
114
115#define SDMA_DBG(req, fmt, ...)				     \
116	hfi1_cdbg(SDMA, "[%u:%u:%u:%u] " fmt, (req)->pq->dd->unit, \
117		 (req)->pq->ctxt, (req)->pq->subctxt, (req)->info.comp_idx, \
118		 ##__VA_ARGS__)
119
120struct hfi1_user_sdma_pkt_q {
121	u16 ctxt;
122	u16 subctxt;
123	u16 n_max_reqs;
124	atomic_t n_reqs;
125	u16 reqidx;
126	struct hfi1_devdata *dd;
127	struct kmem_cache *txreq_cache;
128	struct user_sdma_request *reqs;
129	unsigned long *req_in_use;
130	struct iowait busy;
131	enum pkt_q_sdma_state state;
132	wait_queue_head_t wait;
133	unsigned long unpinned;
134	struct mmu_rb_handler *handler;
135	atomic_t n_locked;
136	struct mm_struct *mm;
137};
138
139struct hfi1_user_sdma_comp_q {
140	u16 nentries;
141	struct hfi1_sdma_comp_entry *comps;
142};
143
144struct sdma_mmu_node {
145	struct mmu_rb_node rb;
146	struct hfi1_user_sdma_pkt_q *pq;
147	atomic_t refcount;
148	struct page **pages;
149	unsigned int npages;
150};
151
152struct user_sdma_iovec {
153	struct list_head list;
154	struct iovec iov;
155	/* number of pages in this vector */
156	unsigned int npages;
157	/* array of pinned pages for this vector */
158	struct page **pages;
159	/*
160	 * offset into the virtual address space of the vector at
161	 * which we last left off.
162	 */
163	u64 offset;
164	struct sdma_mmu_node *node;
165};
166
167/* evict operation argument */
168struct evict_data {
169	u32 cleared;	/* count evicted so far */
170	u32 target;	/* target count to evict */
171};
172
173struct user_sdma_request {
174	/* This is the original header from user space */
175	struct hfi1_pkt_header hdr;
176
177	/* Read mostly fields */
178	struct hfi1_user_sdma_pkt_q *pq ____cacheline_aligned_in_smp;
179	struct hfi1_user_sdma_comp_q *cq;
180	/*
181	 * Pointer to the SDMA engine for this request.
182	 * Since different request could be on different VLs,
183	 * each request will need it's own engine pointer.
184	 */
185	struct sdma_engine *sde;
186	struct sdma_req_info info;
187	/* TID array values copied from the tid_iov vector */
188	u32 *tids;
189	/* total length of the data in the request */
190	u32 data_len;
191	/* number of elements copied to the tids array */
192	u16 n_tids;
193	/*
194	 * We copy the iovs for this request (based on
195	 * info.iovcnt). These are only the data vectors
196	 */
197	u8 data_iovs;
198	s8 ahg_idx;
199
200	/* Writeable fields shared with interrupt */
201	u16 seqcomp ____cacheline_aligned_in_smp;
202	u16 seqsubmitted;
203
204	/* Send side fields */
205	struct list_head txps ____cacheline_aligned_in_smp;
206	u16 seqnum;
207	/*
208	 * KDETH.OFFSET (TID) field
209	 * The offset can cover multiple packets, depending on the
210	 * size of the TID entry.
211	 */
212	u32 tidoffset;
213	/*
214	 * KDETH.Offset (Eager) field
215	 * We need to remember the initial value so the headers
216	 * can be updated properly.
217	 */
218	u32 koffset;
219	u32 sent;
220	/* TID index copied from the tid_iov vector */
221	u16 tididx;
222	/* progress index moving along the iovs array */
223	u8 iov_idx;
224	u8 has_error;
225
226	struct user_sdma_iovec iovs[MAX_VECTORS_PER_REQ];
227} ____cacheline_aligned_in_smp;
228
229/*
230 * A single txreq could span up to 3 physical pages when the MTU
231 * is sufficiently large (> 4K). Each of the IOV pointers also
232 * needs it's own set of flags so the vector has been handled
233 * independently of each other.
234 */
235struct user_sdma_txreq {
236	/* Packet header for the txreq */
237	struct hfi1_pkt_header hdr;
238	struct sdma_txreq txreq;
239	struct list_head list;
240	struct user_sdma_request *req;
241	u16 flags;
242	u16 seqnum;
243};
244
245int hfi1_user_sdma_alloc_queues(struct hfi1_ctxtdata *uctxt,
246				struct hfi1_filedata *fd);
247int hfi1_user_sdma_free_queues(struct hfi1_filedata *fd,
248			       struct hfi1_ctxtdata *uctxt);
249int hfi1_user_sdma_process_request(struct hfi1_filedata *fd,
250				   struct iovec *iovec, unsigned long dim,
251				   unsigned long *count);
252
253#endif /* _HFI1_USER_SDMA_H */