Linux Audio

Check our new training course

Loading...
v6.2
  1/*
  2 * Copyright 2014 Advanced Micro Devices, Inc.
  3 *
  4 * Permission is hereby granted, free of charge, to any person obtaining a
  5 * copy of this software and associated documentation files (the "Software"),
  6 * to deal in the Software without restriction, including without limitation
  7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8 * and/or sell copies of the Software, and to permit persons to whom the
  9 * Software is furnished to do so, subject to the following conditions:
 10 *
 11 * The above copyright notice and this permission notice shall be included in
 12 * all copies or substantial portions of the Software.
 13 *
 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 20 * OTHER DEALINGS IN THE SOFTWARE.
 21 *
 22 */
 23
 24#include <linux/dma-mapping.h>
 25
 26#include "amdgpu.h"
 27#include "amdgpu_ih.h"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 28
 29/**
 30 * amdgpu_ih_ring_init - initialize the IH state
 31 *
 32 * @adev: amdgpu_device pointer
 33 * @ih: ih ring to initialize
 34 * @ring_size: ring size to allocate
 35 * @use_bus_addr: true when we can use dma_alloc_coherent
 36 *
 37 * Initializes the IH state and allocates a buffer
 38 * for the IH ring buffer.
 39 * Returns 0 for success, errors for failure.
 40 */
 41int amdgpu_ih_ring_init(struct amdgpu_device *adev, struct amdgpu_ih_ring *ih,
 42			unsigned ring_size, bool use_bus_addr)
 43{
 44	u32 rb_bufsz;
 45	int r;
 46
 47	/* Align ring size */
 48	rb_bufsz = order_base_2(ring_size / 4);
 49	ring_size = (1 << rb_bufsz) * 4;
 50	ih->ring_size = ring_size;
 51	ih->ptr_mask = ih->ring_size - 1;
 52	ih->rptr = 0;
 53	ih->use_bus_addr = use_bus_addr;
 54
 55	if (use_bus_addr) {
 56		dma_addr_t dma_addr;
 57
 58		if (ih->ring)
 59			return 0;
 60
 61		/* add 8 bytes for the rptr/wptr shadows and
 62		 * add them to the end of the ring allocation.
 63		 */
 64		ih->ring = dma_alloc_coherent(adev->dev, ih->ring_size + 8,
 65					      &dma_addr, GFP_KERNEL);
 66		if (ih->ring == NULL)
 67			return -ENOMEM;
 68
 69		ih->gpu_addr = dma_addr;
 70		ih->wptr_addr = dma_addr + ih->ring_size;
 71		ih->wptr_cpu = &ih->ring[ih->ring_size / 4];
 72		ih->rptr_addr = dma_addr + ih->ring_size + 4;
 73		ih->rptr_cpu = &ih->ring[(ih->ring_size / 4) + 1];
 74	} else {
 75		unsigned wptr_offs, rptr_offs;
 76
 77		r = amdgpu_device_wb_get(adev, &wptr_offs);
 78		if (r)
 79			return r;
 80
 81		r = amdgpu_device_wb_get(adev, &rptr_offs);
 82		if (r) {
 83			amdgpu_device_wb_free(adev, wptr_offs);
 84			return r;
 85		}
 86
 87		r = amdgpu_bo_create_kernel(adev, ih->ring_size, PAGE_SIZE,
 88					    AMDGPU_GEM_DOMAIN_GTT,
 89					    &ih->ring_obj, &ih->gpu_addr,
 90					    (void **)&ih->ring);
 91		if (r) {
 92			amdgpu_device_wb_free(adev, rptr_offs);
 93			amdgpu_device_wb_free(adev, wptr_offs);
 94			return r;
 95		}
 96
 97		ih->wptr_addr = adev->wb.gpu_addr + wptr_offs * 4;
 98		ih->wptr_cpu = &adev->wb.wb[wptr_offs];
 99		ih->rptr_addr = adev->wb.gpu_addr + rptr_offs * 4;
100		ih->rptr_cpu = &adev->wb.wb[rptr_offs];
101	}
102
103	init_waitqueue_head(&ih->wait_process);
104	return 0;
105}
106
107/**
108 * amdgpu_ih_ring_fini - tear down the IH state
109 *
110 * @adev: amdgpu_device pointer
111 * @ih: ih ring to tear down
112 *
113 * Tears down the IH state and frees buffer
114 * used for the IH ring buffer.
115 */
116void amdgpu_ih_ring_fini(struct amdgpu_device *adev, struct amdgpu_ih_ring *ih)
117{
118
119	if (!ih->ring)
120		return;
121
122	if (ih->use_bus_addr) {
123
124		/* add 8 bytes for the rptr/wptr shadows and
125		 * add them to the end of the ring allocation.
126		 */
127		dma_free_coherent(adev->dev, ih->ring_size + 8,
128				  (void *)ih->ring, ih->gpu_addr);
129		ih->ring = NULL;
130	} else {
131		amdgpu_bo_free_kernel(&ih->ring_obj, &ih->gpu_addr,
132				      (void **)&ih->ring);
133		amdgpu_device_wb_free(adev, (ih->wptr_addr - ih->gpu_addr) / 4);
134		amdgpu_device_wb_free(adev, (ih->rptr_addr - ih->gpu_addr) / 4);
 
135	}
136}
137
138/**
139 * amdgpu_ih_ring_write - write IV to the ring buffer
140 *
141 * @ih: ih ring to write to
142 * @iv: the iv to write
143 * @num_dw: size of the iv in dw
144 *
145 * Writes an IV to the ring buffer using the CPU and increment the wptr.
146 * Used for testing and delegating IVs to a software ring.
147 */
148void amdgpu_ih_ring_write(struct amdgpu_ih_ring *ih, const uint32_t *iv,
149			  unsigned int num_dw)
150{
151	uint32_t wptr = le32_to_cpu(*ih->wptr_cpu) >> 2;
152	unsigned int i;
153
154	for (i = 0; i < num_dw; ++i)
155	        ih->ring[wptr++] = cpu_to_le32(iv[i]);
156
157	wptr <<= 2;
158	wptr &= ih->ptr_mask;
159
160	/* Only commit the new wptr if we don't overflow */
161	if (wptr != READ_ONCE(ih->rptr)) {
162		wmb();
163		WRITE_ONCE(*ih->wptr_cpu, cpu_to_le32(wptr));
164	}
165}
166
167/**
168 * amdgpu_ih_wait_on_checkpoint_process_ts - wait to process IVs up to checkpoint
169 *
170 * @adev: amdgpu_device pointer
171 * @ih: ih ring to process
172 *
173 * Used to ensure ring has processed IVs up to the checkpoint write pointer.
174 */
175int amdgpu_ih_wait_on_checkpoint_process_ts(struct amdgpu_device *adev,
176					struct amdgpu_ih_ring *ih)
177{
178	uint32_t checkpoint_wptr;
179	uint64_t checkpoint_ts;
180	long timeout = HZ;
181
182	if (!ih->enabled || adev->shutdown)
183		return -ENODEV;
184
185	checkpoint_wptr = amdgpu_ih_get_wptr(adev, ih);
186	/* Order wptr with ring data. */
187	rmb();
188	checkpoint_ts = amdgpu_ih_decode_iv_ts(adev, ih, checkpoint_wptr, -1);
189
190	return wait_event_interruptible_timeout(ih->wait_process,
191		    amdgpu_ih_ts_after(checkpoint_ts, ih->processed_timestamp) ||
192		    ih->rptr == amdgpu_ih_get_wptr(adev, ih), timeout);
193}
194
195/**
196 * amdgpu_ih_process - interrupt handler
197 *
198 * @adev: amdgpu_device pointer
199 * @ih: ih ring to process
200 *
201 * Interrupt hander (VI), walk the IH ring.
202 * Returns irq process return code.
203 */
204int amdgpu_ih_process(struct amdgpu_device *adev, struct amdgpu_ih_ring *ih)
205{
206	unsigned int count;
207	u32 wptr;
208
209	if (!ih->enabled || adev->shutdown)
210		return IRQ_NONE;
211
212	wptr = amdgpu_ih_get_wptr(adev, ih);
213
214restart_ih:
215	count  = AMDGPU_IH_MAX_NUM_IVS;
216	DRM_DEBUG("%s: rptr %d, wptr %d\n", __func__, ih->rptr, wptr);
 
 
 
217
218	/* Order reading of wptr vs. reading of IH ring data */
219	rmb();
220
221	while (ih->rptr != wptr && --count) {
222		amdgpu_irq_dispatch(adev, ih);
223		ih->rptr &= ih->ptr_mask;
224	}
225
226	amdgpu_ih_set_rptr(adev, ih);
227	wake_up_all(&ih->wait_process);
 
 
 
 
 
 
 
 
 
 
 
228
229	/* make sure wptr hasn't changed while processing */
230	wptr = amdgpu_ih_get_wptr(adev, ih);
231	if (wptr != ih->rptr)
232		goto restart_ih;
233
234	return IRQ_HANDLED;
235}
236
237/**
238 * amdgpu_ih_decode_iv_helper - decode an interrupt vector
239 *
240 * @adev: amdgpu_device pointer
241 * @ih: ih ring to process
242 * @entry: IV entry
243 *
244 * Decodes the interrupt vector at the current rptr
245 * position and also advance the position for Vega10
246 * and later GPUs.
247 */
248void amdgpu_ih_decode_iv_helper(struct amdgpu_device *adev,
249				struct amdgpu_ih_ring *ih,
250				struct amdgpu_iv_entry *entry)
251{
252	/* wptr/rptr are in bytes! */
253	u32 ring_index = ih->rptr >> 2;
254	uint32_t dw[8];
255
256	dw[0] = le32_to_cpu(ih->ring[ring_index + 0]);
257	dw[1] = le32_to_cpu(ih->ring[ring_index + 1]);
258	dw[2] = le32_to_cpu(ih->ring[ring_index + 2]);
259	dw[3] = le32_to_cpu(ih->ring[ring_index + 3]);
260	dw[4] = le32_to_cpu(ih->ring[ring_index + 4]);
261	dw[5] = le32_to_cpu(ih->ring[ring_index + 5]);
262	dw[6] = le32_to_cpu(ih->ring[ring_index + 6]);
263	dw[7] = le32_to_cpu(ih->ring[ring_index + 7]);
264
265	entry->client_id = dw[0] & 0xff;
266	entry->src_id = (dw[0] >> 8) & 0xff;
267	entry->ring_id = (dw[0] >> 16) & 0xff;
268	entry->vmid = (dw[0] >> 24) & 0xf;
269	entry->vmid_src = (dw[0] >> 31);
270	entry->timestamp = dw[1] | ((u64)(dw[2] & 0xffff) << 32);
271	entry->timestamp_src = dw[2] >> 31;
272	entry->pasid = dw[3] & 0xffff;
273	entry->pasid_src = dw[3] >> 31;
274	entry->src_data[0] = dw[4];
275	entry->src_data[1] = dw[5];
276	entry->src_data[2] = dw[6];
277	entry->src_data[3] = dw[7];
278
279	/* wptr/rptr are in bytes! */
280	ih->rptr += 32;
281}
282
283uint64_t amdgpu_ih_decode_iv_ts_helper(struct amdgpu_ih_ring *ih, u32 rptr,
284				       signed int offset)
285{
286	uint32_t iv_size = 32;
287	uint32_t ring_index;
288	uint32_t dw1, dw2;
289
290	rptr += iv_size * offset;
291	ring_index = (rptr & ih->ptr_mask) >> 2;
292
293	dw1 = le32_to_cpu(ih->ring[ring_index + 1]);
294	dw2 = le32_to_cpu(ih->ring[ring_index + 2]);
295	return dw1 | ((u64)(dw2 & 0xffff) << 32);
296}
v4.10.11
  1/*
  2 * Copyright 2014 Advanced Micro Devices, Inc.
  3 *
  4 * Permission is hereby granted, free of charge, to any person obtaining a
  5 * copy of this software and associated documentation files (the "Software"),
  6 * to deal in the Software without restriction, including without limitation
  7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8 * and/or sell copies of the Software, and to permit persons to whom the
  9 * Software is furnished to do so, subject to the following conditions:
 10 *
 11 * The above copyright notice and this permission notice shall be included in
 12 * all copies or substantial portions of the Software.
 13 *
 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 20 * OTHER DEALINGS IN THE SOFTWARE.
 21 *
 22 */
 23
 24#include <drm/drmP.h>
 
 25#include "amdgpu.h"
 26#include "amdgpu_ih.h"
 27#include "amdgpu_amdkfd.h"
 28
 29/**
 30 * amdgpu_ih_ring_alloc - allocate memory for the IH ring
 31 *
 32 * @adev: amdgpu_device pointer
 33 *
 34 * Allocate a ring buffer for the interrupt controller.
 35 * Returns 0 for success, errors for failure.
 36 */
 37static int amdgpu_ih_ring_alloc(struct amdgpu_device *adev)
 38{
 39	int r;
 40
 41	/* Allocate ring buffer */
 42	if (adev->irq.ih.ring_obj == NULL) {
 43		r = amdgpu_bo_create_kernel(adev, adev->irq.ih.ring_size,
 44					    PAGE_SIZE, AMDGPU_GEM_DOMAIN_GTT,
 45					    &adev->irq.ih.ring_obj,
 46					    &adev->irq.ih.gpu_addr,
 47					    (void **)&adev->irq.ih.ring);
 48		if (r) {
 49			DRM_ERROR("amdgpu: failed to create ih ring buffer (%d).\n", r);
 50			return r;
 51		}
 52	}
 53	return 0;
 54}
 55
 56/**
 57 * amdgpu_ih_ring_init - initialize the IH state
 58 *
 59 * @adev: amdgpu_device pointer
 
 
 
 60 *
 61 * Initializes the IH state and allocates a buffer
 62 * for the IH ring buffer.
 63 * Returns 0 for success, errors for failure.
 64 */
 65int amdgpu_ih_ring_init(struct amdgpu_device *adev, unsigned ring_size,
 66			bool use_bus_addr)
 67{
 68	u32 rb_bufsz;
 69	int r;
 70
 71	/* Align ring size */
 72	rb_bufsz = order_base_2(ring_size / 4);
 73	ring_size = (1 << rb_bufsz) * 4;
 74	adev->irq.ih.ring_size = ring_size;
 75	adev->irq.ih.ptr_mask = adev->irq.ih.ring_size - 1;
 76	adev->irq.ih.rptr = 0;
 77	adev->irq.ih.use_bus_addr = use_bus_addr;
 78
 79	if (adev->irq.ih.use_bus_addr) {
 80		if (!adev->irq.ih.ring) {
 81			/* add 8 bytes for the rptr/wptr shadows and
 82			 * add them to the end of the ring allocation.
 83			 */
 84			adev->irq.ih.ring = pci_alloc_consistent(adev->pdev,
 85								 adev->irq.ih.ring_size + 8,
 86								 &adev->irq.ih.rb_dma_addr);
 87			if (adev->irq.ih.ring == NULL)
 88				return -ENOMEM;
 89			memset((void *)adev->irq.ih.ring, 0, adev->irq.ih.ring_size + 8);
 90			adev->irq.ih.wptr_offs = (adev->irq.ih.ring_size / 4) + 0;
 91			adev->irq.ih.rptr_offs = (adev->irq.ih.ring_size / 4) + 1;
 92		}
 93		return 0;
 
 
 
 
 94	} else {
 95		r = amdgpu_wb_get(adev, &adev->irq.ih.wptr_offs);
 
 
 
 
 
 
 96		if (r) {
 97			dev_err(adev->dev, "(%d) ih wptr_offs wb alloc failed\n", r);
 98			return r;
 99		}
100
101		r = amdgpu_wb_get(adev, &adev->irq.ih.rptr_offs);
 
 
 
102		if (r) {
103			amdgpu_wb_free(adev, adev->irq.ih.wptr_offs);
104			dev_err(adev->dev, "(%d) ih rptr_offs wb alloc failed\n", r);
105			return r;
106		}
107
108		return amdgpu_ih_ring_alloc(adev);
 
 
 
109	}
 
 
 
110}
111
112/**
113 * amdgpu_ih_ring_fini - tear down the IH state
114 *
115 * @adev: amdgpu_device pointer
 
116 *
117 * Tears down the IH state and frees buffer
118 * used for the IH ring buffer.
119 */
120void amdgpu_ih_ring_fini(struct amdgpu_device *adev)
121{
122	if (adev->irq.ih.use_bus_addr) {
123		if (adev->irq.ih.ring) {
124			/* add 8 bytes for the rptr/wptr shadows and
125			 * add them to the end of the ring allocation.
126			 */
127			pci_free_consistent(adev->pdev, adev->irq.ih.ring_size + 8,
128					    (void *)adev->irq.ih.ring,
129					    adev->irq.ih.rb_dma_addr);
130			adev->irq.ih.ring = NULL;
131		}
 
 
132	} else {
133		amdgpu_bo_free_kernel(&adev->irq.ih.ring_obj,
134				      &adev->irq.ih.gpu_addr,
135				      (void **)&adev->irq.ih.ring);
136		amdgpu_wb_free(adev, adev->irq.ih.wptr_offs);
137		amdgpu_wb_free(adev, adev->irq.ih.rptr_offs);
138	}
139}
140
141/**
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
142 * amdgpu_ih_process - interrupt handler
143 *
144 * @adev: amdgpu_device pointer
 
145 *
146 * Interrupt hander (VI), walk the IH ring.
147 * Returns irq process return code.
148 */
149int amdgpu_ih_process(struct amdgpu_device *adev)
150{
151	struct amdgpu_iv_entry entry;
152	u32 wptr;
153
154	if (!adev->irq.ih.enabled || adev->shutdown)
155		return IRQ_NONE;
156
157	wptr = amdgpu_ih_get_wptr(adev);
158
159restart_ih:
160	/* is somebody else already processing irqs? */
161	if (atomic_xchg(&adev->irq.ih.lock, 1))
162		return IRQ_NONE;
163
164	DRM_DEBUG("%s: rptr %d, wptr %d\n", __func__, adev->irq.ih.rptr, wptr);
165
166	/* Order reading of wptr vs. reading of IH ring data */
167	rmb();
168
169	while (adev->irq.ih.rptr != wptr) {
170		u32 ring_index = adev->irq.ih.rptr >> 2;
 
 
171
172		/* Before dispatching irq to IP blocks, send it to amdkfd */
173		amdgpu_amdkfd_interrupt(adev,
174				(const void *) &adev->irq.ih.ring[ring_index]);
175
176		entry.iv_entry = (const uint32_t *)
177			&adev->irq.ih.ring[ring_index];
178		amdgpu_ih_decode_iv(adev, &entry);
179		adev->irq.ih.rptr &= adev->irq.ih.ptr_mask;
180
181		amdgpu_irq_dispatch(adev, &entry);
182	}
183	amdgpu_ih_set_rptr(adev);
184	atomic_set(&adev->irq.ih.lock, 0);
185
186	/* make sure wptr hasn't changed while processing */
187	wptr = amdgpu_ih_get_wptr(adev);
188	if (wptr != adev->irq.ih.rptr)
189		goto restart_ih;
190
191	return IRQ_HANDLED;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
192}