amdgpu_ctx.c - drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c - Linux diff v5.9

  1/*
  2 * Copyright 2015 Advanced Micro Devices, Inc.
  3 *
  4 * Permission is hereby granted, free of charge, to any person obtaining a
  5 * copy of this software and associated documentation files (the "Software"),
  6 * to deal in the Software without restriction, including without limitation
  7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8 * and/or sell copies of the Software, and to permit persons to whom the
  9 * Software is furnished to do so, subject to the following conditions:
 10 *
 11 * The above copyright notice and this permission notice shall be included in
 12 * all copies or substantial portions of the Software.
 13 *
 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 20 * OTHER DEALINGS IN THE SOFTWARE.
 21 *
 22 * Authors: monk liu <monk.liu@amd.com>
 23 */
 24
 
 25#include <drm/drm_auth.h>
 26#include "amdgpu.h"
 27#include "amdgpu_sched.h"
 28#include "amdgpu_ras.h"
 29#include <linux/nospec.h>
 30
 /*
  * Given a pointer to the 'entity' member embedded in a
  * struct amdgpu_ctx_entity, recover the enclosing structure.
  */
 31#define to_amdgpu_ctx_entity(e)	\
 32	container_of((e), struct amdgpu_ctx_entity, entity)
 33
 /*
  * Entity count per HW IP type, indexed by AMDGPU_HW_IP_*.
  * amdgpu_ctx_get_entity() rejects any ring index that is not below the
  * entry for the requested IP type, and the teardown/flush loops in this
  * file use the same bound when walking ctx->entities[ip][].
  */
 34const unsigned int amdgpu_ctx_num_entities[AMDGPU_HW_IP_NUM] = {
 35	[AMDGPU_HW_IP_GFX]	=	1,
 36	[AMDGPU_HW_IP_COMPUTE]	=	4,
 37	[AMDGPU_HW_IP_DMA]	=	2,
 38	[AMDGPU_HW_IP_UVD]	=	1,
 39	[AMDGPU_HW_IP_VCE]	=	1,
 40	[AMDGPU_HW_IP_UVD_ENC]	=	1,
 41	[AMDGPU_HW_IP_VCN_DEC]	=	1,
 42	[AMDGPU_HW_IP_VCN_ENC]	=	1,
 43	[AMDGPU_HW_IP_VCN_JPEG]	=	1,
 44};
 45
 46static int amdgpu_ctx_priority_permit(struct drm_file *filp,
 47				      enum drm_sched_priority priority)
 48{
 49	if (priority < 0 || priority >= DRM_SCHED_PRIORITY_MAX)
 50		return -EINVAL;
 51
 52	/* NORMAL and below are accessible by everyone */
 53	if (priority <= DRM_SCHED_PRIORITY_NORMAL)
 54		return 0;
 55
 56	if (capable(CAP_SYS_NICE))
 57		return 0;
 58
 59	if (drm_is_current_master(filp))
 60		return 0;
 61
 62	return -EACCES;
 63}
 64
 65static enum gfx_pipe_priority amdgpu_ctx_sched_prio_to_compute_prio(enum drm_sched_priority prio)
 66{
 67	switch (prio) {
 68	case DRM_SCHED_PRIORITY_HIGH_HW:
 69	case DRM_SCHED_PRIORITY_KERNEL:
 70		return AMDGPU_GFX_PIPE_PRIO_HIGH;
 71	default:
 72		return AMDGPU_GFX_PIPE_PRIO_NORMAL;
 73	}
 74}
 75
 76static unsigned int amdgpu_ctx_prio_sched_to_hw(struct amdgpu_device *adev,
 77						 enum drm_sched_priority prio,
 78						 u32 hw_ip)
 79{
 80	unsigned int hw_prio;
 81
 82	hw_prio = (hw_ip == AMDGPU_HW_IP_COMPUTE) ?
 83			amdgpu_ctx_sched_prio_to_compute_prio(prio) :
 84			AMDGPU_RING_PRIO_DEFAULT;
 85	hw_ip = array_index_nospec(hw_ip, AMDGPU_HW_IP_NUM);
 86	if (adev->gpu_sched[hw_ip][hw_prio].num_scheds == 0)
 87		hw_prio = AMDGPU_RING_PRIO_DEFAULT;
 88
 89	return hw_prio;
 90}
 91
 92static int amdgpu_ctx_init_entity(struct amdgpu_ctx *ctx, u32 hw_ip,
 93				   const u32 ring)
 94{
 95	struct amdgpu_device *adev = ctx->adev;
 96	struct amdgpu_ctx_entity *entity;
 97	struct drm_gpu_scheduler **scheds = NULL, *sched = NULL;
 98	unsigned num_scheds = 0;
 99	unsigned int hw_prio;
100	enum drm_sched_priority priority;
101	int r;
102
103	entity = kcalloc(1, offsetof(typeof(*entity), fences[amdgpu_sched_jobs]),
104			 GFP_KERNEL);
105	if (!entity)
106		return  -ENOMEM;
107
108	entity->sequence = 1;
109	priority = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
110				ctx->init_priority : ctx->override_priority;
111	hw_prio = amdgpu_ctx_prio_sched_to_hw(adev, priority, hw_ip);
112
113	hw_ip = array_index_nospec(hw_ip, AMDGPU_HW_IP_NUM);
114	scheds = adev->gpu_sched[hw_ip][hw_prio].sched;
115	num_scheds = adev->gpu_sched[hw_ip][hw_prio].num_scheds;
116
117	if (hw_ip == AMDGPU_HW_IP_VCN_ENC || hw_ip == AMDGPU_HW_IP_VCN_DEC) {
118		sched = drm_sched_pick_best(scheds, num_scheds);
119		scheds = &sched;
120		num_scheds = 1;
121	}
122
123	r = drm_sched_entity_init(&entity->entity, priority, scheds, num_scheds,
124				  &ctx->guilty);
125	if (r)
126		goto error_free_entity;
127
128	ctx->entities[hw_ip][ring] = entity;
129	return 0;
130
131error_free_entity:
132	kfree(entity);
133
134	return r;
135}
136
137static int amdgpu_ctx_init(struct amdgpu_device *adev,
138			   enum drm_sched_priority priority,
139			   struct drm_file *filp,
140			   struct amdgpu_ctx *ctx)
141{
 
142	int r;
143
 
 
 
144	r = amdgpu_ctx_priority_permit(filp, priority);
145	if (r)
146		return r;
147
148	memset(ctx, 0, sizeof(*ctx));
149
150	ctx->adev = adev;
151
152	kref_init(&ctx->refcount);
153	spin_lock_init(&ctx->ring_lock);
 
 
 
 
 
154	mutex_init(&ctx->lock);
155
 
 
 
 
 
156	ctx->reset_counter = atomic_read(&adev->gpu_reset_counter);
157	ctx->reset_counter_query = ctx->reset_counter;
158	ctx->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
159	ctx->init_priority = priority;
160	ctx->override_priority = DRM_SCHED_PRIORITY_UNSET;
161
162	return 0;
163}
 
 
164
165static void amdgpu_ctx_fini_entity(struct amdgpu_ctx_entity *entity)
166{
167
168	int i;
 
169
170	if (!entity)
171		return;
 
 
 
 
 
 
 
172
173	for (i = 0; i < amdgpu_sched_jobs; ++i)
174		dma_fence_put(entity->fences[i]);
175
176	kfree(entity);
 
 
 
 
 
 
177}
178
179static void amdgpu_ctx_fini(struct kref *ref)
180{
181	struct amdgpu_ctx *ctx = container_of(ref, struct amdgpu_ctx, refcount);
182	struct amdgpu_device *adev = ctx->adev;
183	unsigned i, j;
184
185	if (!adev)
186		return;
187
188	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
189		for (j = 0; j < AMDGPU_MAX_ENTITY_NUM; ++j) {
190			amdgpu_ctx_fini_entity(ctx->entities[i][j]);
191			ctx->entities[i][j] = NULL;
192		}
193	}
194
195	mutex_destroy(&ctx->lock);
196	kfree(ctx);
197}
198
199int amdgpu_ctx_get_entity(struct amdgpu_ctx *ctx, u32 hw_ip, u32 instance,
200			  u32 ring, struct drm_sched_entity **entity)
201{
202	int r;
203
204	if (hw_ip >= AMDGPU_HW_IP_NUM) {
205		DRM_ERROR("unknown HW IP type: %d\n", hw_ip);
206		return -EINVAL;
207	}
208
209	/* Right now all IPs have only one instance - multiple rings. */
210	if (instance != 0) {
211		DRM_DEBUG("invalid ip instance: %d\n", instance);
212		return -EINVAL;
213	}
214
215	if (ring >= amdgpu_ctx_num_entities[hw_ip]) {
216		DRM_DEBUG("invalid ring: %d %d\n", hw_ip, ring);
217		return -EINVAL;
218	}
219
220	if (ctx->entities[hw_ip][ring] == NULL) {
221		r = amdgpu_ctx_init_entity(ctx, hw_ip, ring);
222		if (r)
223			return r;
224	}
225
226	*entity = &ctx->entities[hw_ip][ring]->entity;
227	return 0;
228}
229
230static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
231			    struct amdgpu_fpriv *fpriv,
232			    struct drm_file *filp,
233			    enum drm_sched_priority priority,
234			    uint32_t *id)
235{
236	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
237	struct amdgpu_ctx *ctx;
238	int r;
239
240	ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
241	if (!ctx)
242		return -ENOMEM;
243
244	mutex_lock(&mgr->lock);
245	r = idr_alloc(&mgr->ctx_handles, ctx, 1, AMDGPU_VM_MAX_NUM_CTX, GFP_KERNEL);
246	if (r < 0) {
247		mutex_unlock(&mgr->lock);
248		kfree(ctx);
249		return r;
250	}
251
252	*id = (uint32_t)r;
253	r = amdgpu_ctx_init(adev, priority, filp, ctx);
254	if (r) {
255		idr_remove(&mgr->ctx_handles, *id);
256		*id = 0;
257		kfree(ctx);
258	}
259	mutex_unlock(&mgr->lock);
260	return r;
261}
262
263static void amdgpu_ctx_do_release(struct kref *ref)
264{
265	struct amdgpu_ctx *ctx;
266	u32 i, j;
267
268	ctx = container_of(ref, struct amdgpu_ctx, refcount);
269	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
270		for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
271			if (!ctx->entities[i][j])
272				continue;
273
274			drm_sched_entity_destroy(&ctx->entities[i][j]->entity);
275		}
276	}
277
278	amdgpu_ctx_fini(ref);
279}
280
281static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
282{
283	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
284	struct amdgpu_ctx *ctx;
285
286	mutex_lock(&mgr->lock);
287	ctx = idr_remove(&mgr->ctx_handles, id);
288	if (ctx)
289		kref_put(&ctx->refcount, amdgpu_ctx_do_release);
290	mutex_unlock(&mgr->lock);
291	return ctx ? 0 : -EINVAL;
292}
293
294static int amdgpu_ctx_query(struct amdgpu_device *adev,
295			    struct amdgpu_fpriv *fpriv, uint32_t id,
296			    union drm_amdgpu_ctx_out *out)
297{
298	struct amdgpu_ctx *ctx;
299	struct amdgpu_ctx_mgr *mgr;
300	unsigned reset_counter;
301
302	if (!fpriv)
303		return -EINVAL;
304
305	mgr = &fpriv->ctx_mgr;
306	mutex_lock(&mgr->lock);
307	ctx = idr_find(&mgr->ctx_handles, id);
308	if (!ctx) {
309		mutex_unlock(&mgr->lock);
310		return -EINVAL;
311	}
312
313	/* TODO: these two are always zero */
314	out->state.flags = 0x0;
315	out->state.hangs = 0x0;
316
317	/* determine if a GPU reset has occured since the last call */
318	reset_counter = atomic_read(&adev->gpu_reset_counter);
319	/* TODO: this should ideally return NO, GUILTY, or INNOCENT. */
320	if (ctx->reset_counter_query == reset_counter)
321		out->state.reset_status = AMDGPU_CTX_NO_RESET;
322	else
323		out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
324	ctx->reset_counter_query = reset_counter;
325
326	mutex_unlock(&mgr->lock);
327	return 0;
328}
329
330static int amdgpu_ctx_query2(struct amdgpu_device *adev,
331	struct amdgpu_fpriv *fpriv, uint32_t id,
332	union drm_amdgpu_ctx_out *out)
333{
334	struct amdgpu_ctx *ctx;
335	struct amdgpu_ctx_mgr *mgr;
336	unsigned long ras_counter;
337
338	if (!fpriv)
339		return -EINVAL;
340
341	mgr = &fpriv->ctx_mgr;
342	mutex_lock(&mgr->lock);
343	ctx = idr_find(&mgr->ctx_handles, id);
344	if (!ctx) {
345		mutex_unlock(&mgr->lock);
346		return -EINVAL;
347	}
348
349	out->state.flags = 0x0;
350	out->state.hangs = 0x0;
351
352	if (ctx->reset_counter != atomic_read(&adev->gpu_reset_counter))
353		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RESET;
354
355	if (ctx->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
356		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_VRAMLOST;
357
358	if (atomic_read(&ctx->guilty))
359		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_GUILTY;
360
361	/*query ue count*/
362	ras_counter = amdgpu_ras_query_error_count(adev, false);
363	/*ras counter is monotonic increasing*/
364	if (ras_counter != ctx->ras_counter_ue) {
365		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RAS_UE;
366		ctx->ras_counter_ue = ras_counter;
367	}
368
369	/*query ce count*/
370	ras_counter = amdgpu_ras_query_error_count(adev, true);
371	if (ras_counter != ctx->ras_counter_ce) {
372		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RAS_CE;
373		ctx->ras_counter_ce = ras_counter;
374	}
375
376	mutex_unlock(&mgr->lock);
377	return 0;
378}
379
380int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
381		     struct drm_file *filp)
382{
383	int r;
384	uint32_t id;
385	enum drm_sched_priority priority;
386
387	union drm_amdgpu_ctx *args = data;
388	struct amdgpu_device *adev = dev->dev_private;
389	struct amdgpu_fpriv *fpriv = filp->driver_priv;
390
391	r = 0;
392	id = args->in.ctx_id;
393	priority = amdgpu_to_sched_priority(args->in.priority);
394
395	/* For backwards compatibility reasons, we need to accept
396	 * ioctls with garbage in the priority field */
397	if (priority == DRM_SCHED_PRIORITY_INVALID)
398		priority = DRM_SCHED_PRIORITY_NORMAL;
399
400	switch (args->in.op) {
401	case AMDGPU_CTX_OP_ALLOC_CTX:
402		r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
403		args->out.alloc.ctx_id = id;
404		break;
405	case AMDGPU_CTX_OP_FREE_CTX:
406		r = amdgpu_ctx_free(fpriv, id);
407		break;
408	case AMDGPU_CTX_OP_QUERY_STATE:
409		r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
410		break;
411	case AMDGPU_CTX_OP_QUERY_STATE2:
412		r = amdgpu_ctx_query2(adev, fpriv, id, &args->out);
413		break;
414	default:
415		return -EINVAL;
416	}
417
418	return r;
419}
420
421struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
422{
423	struct amdgpu_ctx *ctx;
424	struct amdgpu_ctx_mgr *mgr;
425
426	if (!fpriv)
427		return NULL;
428
429	mgr = &fpriv->ctx_mgr;
430
431	mutex_lock(&mgr->lock);
432	ctx = idr_find(&mgr->ctx_handles, id);
433	if (ctx)
434		kref_get(&ctx->refcount);
435	mutex_unlock(&mgr->lock);
436	return ctx;
437}
438
439int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
440{
441	if (ctx == NULL)
442		return -EINVAL;
443
444	kref_put(&ctx->refcount, amdgpu_ctx_do_release);
445	return 0;
446}
447
448void amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx,
449			  struct drm_sched_entity *entity,
450			  struct dma_fence *fence, uint64_t* handle)
451{
452	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
453	uint64_t seq = centity->sequence;
454	struct dma_fence *other = NULL;
455	unsigned idx = 0;
 
456
457	idx = seq & (amdgpu_sched_jobs - 1);
458	other = centity->fences[idx];
459	if (other)
460		BUG_ON(!dma_fence_is_signaled(other));
461
462	dma_fence_get(fence);
463
464	spin_lock(&ctx->ring_lock);
465	centity->fences[idx] = fence;
466	centity->sequence++;
467	spin_unlock(&ctx->ring_lock);
468
469	dma_fence_put(other);
470	if (handle)
471		*handle = seq;
 
 
472}
473
474struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
475				       struct drm_sched_entity *entity,
476				       uint64_t seq)
477{
478	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
479	struct dma_fence *fence;
480
481	spin_lock(&ctx->ring_lock);
482
483	if (seq == ~0ull)
484		seq = centity->sequence - 1;
485
486	if (seq >= centity->sequence) {
487		spin_unlock(&ctx->ring_lock);
488		return ERR_PTR(-EINVAL);
489	}
490
491
492	if (seq + amdgpu_sched_jobs < centity->sequence) {
493		spin_unlock(&ctx->ring_lock);
494		return NULL;
495	}
496
497	fence = dma_fence_get(centity->fences[seq & (amdgpu_sched_jobs - 1)]);
498	spin_unlock(&ctx->ring_lock);
499
500	return fence;
501}
502
503static void amdgpu_ctx_set_entity_priority(struct amdgpu_ctx *ctx,
504					    struct amdgpu_ctx_entity *aentity,
505					    int hw_ip,
506					    enum drm_sched_priority priority)
507{
508	struct amdgpu_device *adev = ctx->adev;
509	unsigned int hw_prio;
510	struct drm_gpu_scheduler **scheds = NULL;
511	unsigned num_scheds;
512
513	/* set sw priority */
514	drm_sched_entity_set_priority(&aentity->entity, priority);
515
516	/* set hw priority */
517	if (hw_ip == AMDGPU_HW_IP_COMPUTE) {
518		hw_prio = amdgpu_ctx_prio_sched_to_hw(adev, priority,
519						      AMDGPU_HW_IP_COMPUTE);
520		hw_prio = array_index_nospec(hw_prio, AMDGPU_RING_PRIO_MAX);
521		scheds = adev->gpu_sched[hw_ip][hw_prio].sched;
522		num_scheds = adev->gpu_sched[hw_ip][hw_prio].num_scheds;
523		drm_sched_entity_modify_sched(&aentity->entity, scheds,
524					      num_scheds);
525	}
526}
527
528void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
529				  enum drm_sched_priority priority)
530{
 
 
 
 
 
531	enum drm_sched_priority ctx_prio;
532	unsigned i, j;
533
534	ctx->override_priority = priority;
535
536	ctx_prio = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
537			ctx->init_priority : ctx->override_priority;
538	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
539		for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
540			if (!ctx->entities[i][j])
541				continue;
542
543			amdgpu_ctx_set_entity_priority(ctx, ctx->entities[i][j],
544						       i, ctx_prio);
545		}
 
 
 
 
 
 
546	}
547}
548
549int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx,
550			       struct drm_sched_entity *entity)
551{
552	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
553	struct dma_fence *other;
554	unsigned idx;
555	long r;
556
557	spin_lock(&ctx->ring_lock);
558	idx = centity->sequence & (amdgpu_sched_jobs - 1);
559	other = dma_fence_get(centity->fences[idx]);
560	spin_unlock(&ctx->ring_lock);
561
562	if (!other)
563		return 0;
564
565	r = dma_fence_wait(other, true);
566	if (r < 0 && r != -ERESTARTSYS)
567		DRM_ERROR("Error (%ld) waiting for fence!\n", r);
568
569	dma_fence_put(other);
570	return r;
571}
572
573void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
574{
575	mutex_init(&mgr->lock);
576	idr_init(&mgr->ctx_handles);
577}
578
579long amdgpu_ctx_mgr_entity_flush(struct amdgpu_ctx_mgr *mgr, long timeout)
580{
581	struct amdgpu_ctx *ctx;
582	struct idr *idp;
583	uint32_t id, i, j;
584
585	idp = &mgr->ctx_handles;
586
587	mutex_lock(&mgr->lock);
588	idr_for_each_entry(idp, ctx, id) {
589		for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
590			for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
591				struct drm_sched_entity *entity;
592
593				if (!ctx->entities[i][j])
594					continue;
595
596				entity = &ctx->entities[i][j]->entity;
597				timeout = drm_sched_entity_flush(entity, timeout);
598			}
599		}
600	}
601	mutex_unlock(&mgr->lock);
602	return timeout;
603}
604
605void amdgpu_ctx_mgr_entity_fini(struct amdgpu_ctx_mgr *mgr)
606{
607	struct amdgpu_ctx *ctx;
608	struct idr *idp;
609	uint32_t id, i, j;
610
611	idp = &mgr->ctx_handles;
612
613	idr_for_each_entry(idp, ctx, id) {
614		if (kref_read(&ctx->refcount) != 1) {
615			DRM_ERROR("ctx %p is still alive\n", ctx);
616			continue;
617		}
618
619		for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
620			for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
621				struct drm_sched_entity *entity;
622
623				if (!ctx->entities[i][j])
624					continue;
625
626				entity = &ctx->entities[i][j]->entity;
627				drm_sched_entity_fini(entity);
628			}
629		}
630	}
631}
632
633void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
634{
635	struct amdgpu_ctx *ctx;
636	struct idr *idp;
637	uint32_t id;
638
639	amdgpu_ctx_mgr_entity_fini(mgr);
640
641	idp = &mgr->ctx_handles;
642
643	idr_for_each_entry(idp, ctx, id) {
644		if (kref_put(&ctx->refcount, amdgpu_ctx_fini) != 1)
645			DRM_ERROR("ctx %p is still alive\n", ctx);
646	}
647
648	idr_destroy(&mgr->ctx_handles);
649	mutex_destroy(&mgr->lock);
650}

  1/*
  2 * Copyright 2015 Advanced Micro Devices, Inc.
  3 *
  4 * Permission is hereby granted, free of charge, to any person obtaining a
  5 * copy of this software and associated documentation files (the "Software"),
  6 * to deal in the Software without restriction, including without limitation
  7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8 * and/or sell copies of the Software, and to permit persons to whom the
  9 * Software is furnished to do so, subject to the following conditions:
 10 *
 11 * The above copyright notice and this permission notice shall be included in
 12 * all copies or substantial portions of the Software.
 13 *
 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 20 * OTHER DEALINGS IN THE SOFTWARE.
 21 *
 22 * Authors: monk liu <monk.liu@amd.com>
 23 */
 24
 25#include <drm/drmP.h>
 26#include <drm/drm_auth.h>
 27#include "amdgpu.h"
 28#include "amdgpu_sched.h"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 29
 30static int amdgpu_ctx_priority_permit(struct drm_file *filp,
 31				      enum drm_sched_priority priority)
 32{
 
 
 
 33	/* NORMAL and below are accessible by everyone */
 34	if (priority <= DRM_SCHED_PRIORITY_NORMAL)
 35		return 0;
 36
 37	if (capable(CAP_SYS_NICE))
 38		return 0;
 39
 40	if (drm_is_current_master(filp))
 41		return 0;
 42
 43	return -EACCES;
 44}
 45
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 46static int amdgpu_ctx_init(struct amdgpu_device *adev,
 47			   enum drm_sched_priority priority,
 48			   struct drm_file *filp,
 49			   struct amdgpu_ctx *ctx)
 50{
 51	unsigned i, j;
 52	int r;
 53
 54	if (priority < 0 || priority >= DRM_SCHED_PRIORITY_MAX)
 55		return -EINVAL;
 56
 57	r = amdgpu_ctx_priority_permit(filp, priority);
 58	if (r)
 59		return r;
 60
 61	memset(ctx, 0, sizeof(*ctx));
 
 62	ctx->adev = adev;
 
 63	kref_init(&ctx->refcount);
 64	spin_lock_init(&ctx->ring_lock);
 65	ctx->fences = kcalloc(amdgpu_sched_jobs * AMDGPU_MAX_RINGS,
 66			      sizeof(struct dma_fence*), GFP_KERNEL);
 67	if (!ctx->fences)
 68		return -ENOMEM;
 69
 70	mutex_init(&ctx->lock);
 71
 72	for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
 73		ctx->rings[i].sequence = 1;
 74		ctx->rings[i].fences = &ctx->fences[amdgpu_sched_jobs * i];
 75	}
 76
 77	ctx->reset_counter = atomic_read(&adev->gpu_reset_counter);
 78	ctx->reset_counter_query = ctx->reset_counter;
 79	ctx->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
 80	ctx->init_priority = priority;
 81	ctx->override_priority = DRM_SCHED_PRIORITY_UNSET;
 82
 83	/* create context entity for each ring */
 84	for (i = 0; i < adev->num_rings; i++) {
 85		struct amdgpu_ring *ring = adev->rings[i];
 86		struct drm_sched_rq *rq;
 87
 88		rq = &ring->sched.sched_rq[priority];
 
 89
 90		if (ring == &adev->gfx.kiq.ring)
 91			continue;
 92
 93		r = drm_sched_entity_init(&ring->sched, &ctx->rings[i].entity,
 94					  rq, amdgpu_sched_jobs, &ctx->guilty);
 95		if (r)
 96			goto failed;
 97	}
 98
 99	r = amdgpu_queue_mgr_init(adev, &ctx->queue_mgr);
100	if (r)
101		goto failed;
102
103	return 0;
 
104
105failed:
106	for (j = 0; j < i; j++)
107		drm_sched_entity_fini(&adev->rings[j]->sched,
108				      &ctx->rings[j].entity);
109	kfree(ctx->fences);
110	ctx->fences = NULL;
111	return r;
112}
113
114static void amdgpu_ctx_fini(struct amdgpu_ctx *ctx)
115{
 
116	struct amdgpu_device *adev = ctx->adev;
117	unsigned i, j;
118
119	if (!adev)
120		return;
121
122	for (i = 0; i < AMDGPU_MAX_RINGS; ++i)
123		for (j = 0; j < amdgpu_sched_jobs; ++j)
124			dma_fence_put(ctx->rings[i].fences[j]);
125	kfree(ctx->fences);
126	ctx->fences = NULL;
127
128	for (i = 0; i < adev->num_rings; i++)
129		drm_sched_entity_fini(&adev->rings[i]->sched,
130				      &ctx->rings[i].entity);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
131
132	amdgpu_queue_mgr_fini(adev, &ctx->queue_mgr);
 
 
 
 
133
134	mutex_destroy(&ctx->lock);
 
135}
136
137static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
138			    struct amdgpu_fpriv *fpriv,
139			    struct drm_file *filp,
140			    enum drm_sched_priority priority,
141			    uint32_t *id)
142{
143	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
144	struct amdgpu_ctx *ctx;
145	int r;
146
147	ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
148	if (!ctx)
149		return -ENOMEM;
150
151	mutex_lock(&mgr->lock);
152	r = idr_alloc(&mgr->ctx_handles, ctx, 1, 0, GFP_KERNEL);
153	if (r < 0) {
154		mutex_unlock(&mgr->lock);
155		kfree(ctx);
156		return r;
157	}
158
159	*id = (uint32_t)r;
160	r = amdgpu_ctx_init(adev, priority, filp, ctx);
161	if (r) {
162		idr_remove(&mgr->ctx_handles, *id);
163		*id = 0;
164		kfree(ctx);
165	}
166	mutex_unlock(&mgr->lock);
167	return r;
168}
169
170static void amdgpu_ctx_do_release(struct kref *ref)
171{
172	struct amdgpu_ctx *ctx;
 
173
174	ctx = container_of(ref, struct amdgpu_ctx, refcount);
 
 
 
 
175
176	amdgpu_ctx_fini(ctx);
 
 
177
178	kfree(ctx);
179}
180
181static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
182{
183	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
184	struct amdgpu_ctx *ctx;
185
186	mutex_lock(&mgr->lock);
187	ctx = idr_remove(&mgr->ctx_handles, id);
188	if (ctx)
189		kref_put(&ctx->refcount, amdgpu_ctx_do_release);
190	mutex_unlock(&mgr->lock);
191	return ctx ? 0 : -EINVAL;
192}
193
194static int amdgpu_ctx_query(struct amdgpu_device *adev,
195			    struct amdgpu_fpriv *fpriv, uint32_t id,
196			    union drm_amdgpu_ctx_out *out)
197{
198	struct amdgpu_ctx *ctx;
199	struct amdgpu_ctx_mgr *mgr;
200	unsigned reset_counter;
201
202	if (!fpriv)
203		return -EINVAL;
204
205	mgr = &fpriv->ctx_mgr;
206	mutex_lock(&mgr->lock);
207	ctx = idr_find(&mgr->ctx_handles, id);
208	if (!ctx) {
209		mutex_unlock(&mgr->lock);
210		return -EINVAL;
211	}
212
213	/* TODO: these two are always zero */
214	out->state.flags = 0x0;
215	out->state.hangs = 0x0;
216
217	/* determine if a GPU reset has occured since the last call */
218	reset_counter = atomic_read(&adev->gpu_reset_counter);
219	/* TODO: this should ideally return NO, GUILTY, or INNOCENT. */
220	if (ctx->reset_counter_query == reset_counter)
221		out->state.reset_status = AMDGPU_CTX_NO_RESET;
222	else
223		out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
224	ctx->reset_counter_query = reset_counter;
225
226	mutex_unlock(&mgr->lock);
227	return 0;
228}
229
230static int amdgpu_ctx_query2(struct amdgpu_device *adev,
231	struct amdgpu_fpriv *fpriv, uint32_t id,
232	union drm_amdgpu_ctx_out *out)
233{
234	struct amdgpu_ctx *ctx;
235	struct amdgpu_ctx_mgr *mgr;
 
236
237	if (!fpriv)
238		return -EINVAL;
239
240	mgr = &fpriv->ctx_mgr;
241	mutex_lock(&mgr->lock);
242	ctx = idr_find(&mgr->ctx_handles, id);
243	if (!ctx) {
244		mutex_unlock(&mgr->lock);
245		return -EINVAL;
246	}
247
248	out->state.flags = 0x0;
249	out->state.hangs = 0x0;
250
251	if (ctx->reset_counter != atomic_read(&adev->gpu_reset_counter))
252		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RESET;
253
254	if (ctx->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
255		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_VRAMLOST;
256
257	if (atomic_read(&ctx->guilty))
258		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_GUILTY;
259
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
260	mutex_unlock(&mgr->lock);
261	return 0;
262}
263
264int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
265		     struct drm_file *filp)
266{
267	int r;
268	uint32_t id;
269	enum drm_sched_priority priority;
270
271	union drm_amdgpu_ctx *args = data;
272	struct amdgpu_device *adev = dev->dev_private;
273	struct amdgpu_fpriv *fpriv = filp->driver_priv;
274
275	r = 0;
276	id = args->in.ctx_id;
277	priority = amdgpu_to_sched_priority(args->in.priority);
278
279	/* For backwards compatibility reasons, we need to accept
280	 * ioctls with garbage in the priority field */
281	if (priority == DRM_SCHED_PRIORITY_INVALID)
282		priority = DRM_SCHED_PRIORITY_NORMAL;
283
284	switch (args->in.op) {
285	case AMDGPU_CTX_OP_ALLOC_CTX:
286		r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
287		args->out.alloc.ctx_id = id;
288		break;
289	case AMDGPU_CTX_OP_FREE_CTX:
290		r = amdgpu_ctx_free(fpriv, id);
291		break;
292	case AMDGPU_CTX_OP_QUERY_STATE:
293		r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
294		break;
295	case AMDGPU_CTX_OP_QUERY_STATE2:
296		r = amdgpu_ctx_query2(adev, fpriv, id, &args->out);
297		break;
298	default:
299		return -EINVAL;
300	}
301
302	return r;
303}
304
305struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
306{
307	struct amdgpu_ctx *ctx;
308	struct amdgpu_ctx_mgr *mgr;
309
310	if (!fpriv)
311		return NULL;
312
313	mgr = &fpriv->ctx_mgr;
314
315	mutex_lock(&mgr->lock);
316	ctx = idr_find(&mgr->ctx_handles, id);
317	if (ctx)
318		kref_get(&ctx->refcount);
319	mutex_unlock(&mgr->lock);
320	return ctx;
321}
322
323int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
324{
325	if (ctx == NULL)
326		return -EINVAL;
327
328	kref_put(&ctx->refcount, amdgpu_ctx_do_release);
329	return 0;
330}
331
332int amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx, struct amdgpu_ring *ring,
333			      struct dma_fence *fence, uint64_t* handler)
 
334{
335	struct amdgpu_ctx_ring *cring = & ctx->rings[ring->idx];
336	uint64_t seq = cring->sequence;
 
337	unsigned idx = 0;
338	struct dma_fence *other = NULL;
339
340	idx = seq & (amdgpu_sched_jobs - 1);
341	other = cring->fences[idx];
342	if (other)
343		BUG_ON(!dma_fence_is_signaled(other));
344
345	dma_fence_get(fence);
346
347	spin_lock(&ctx->ring_lock);
348	cring->fences[idx] = fence;
349	cring->sequence++;
350	spin_unlock(&ctx->ring_lock);
351
352	dma_fence_put(other);
353	if (handler)
354		*handler = seq;
355
356	return 0;
357}
358
359struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
360				       struct amdgpu_ring *ring, uint64_t seq)
 
361{
362	struct amdgpu_ctx_ring *cring = & ctx->rings[ring->idx];
363	struct dma_fence *fence;
364
365	spin_lock(&ctx->ring_lock);
366
367	if (seq == ~0ull)
368		seq = ctx->rings[ring->idx].sequence - 1;
369
370	if (seq >= cring->sequence) {
371		spin_unlock(&ctx->ring_lock);
372		return ERR_PTR(-EINVAL);
373	}
374
375
376	if (seq + amdgpu_sched_jobs < cring->sequence) {
377		spin_unlock(&ctx->ring_lock);
378		return NULL;
379	}
380
381	fence = dma_fence_get(cring->fences[seq & (amdgpu_sched_jobs - 1)]);
382	spin_unlock(&ctx->ring_lock);
383
384	return fence;
385}
386
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
387void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
388				  enum drm_sched_priority priority)
389{
390	int i;
391	struct amdgpu_device *adev = ctx->adev;
392	struct drm_sched_rq *rq;
393	struct drm_sched_entity *entity;
394	struct amdgpu_ring *ring;
395	enum drm_sched_priority ctx_prio;
 
396
397	ctx->override_priority = priority;
398
399	ctx_prio = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
400			ctx->init_priority : ctx->override_priority;
 
 
 
 
401
402	for (i = 0; i < adev->num_rings; i++) {
403		ring = adev->rings[i];
404		entity = &ctx->rings[i].entity;
405		rq = &ring->sched.sched_rq[ctx_prio];
406
407		if (ring->funcs->type == AMDGPU_RING_TYPE_KIQ)
408			continue;
409
410		drm_sched_entity_set_rq(entity, rq);
411	}
412}
413
414int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx, unsigned ring_id)
 
415{
416	struct amdgpu_ctx_ring *cring = &ctx->rings[ring_id];
417	unsigned idx = cring->sequence & (amdgpu_sched_jobs - 1);
418	struct dma_fence *other = cring->fences[idx];
 
419
420	if (other) {
421		signed long r;
422		r = dma_fence_wait(other, true);
423		if (r < 0) {
424			if (r != -ERESTARTSYS)
425				DRM_ERROR("Error (%ld) waiting for fence!\n", r);
 
426
427			return r;
428		}
429	}
430
431	return 0;
 
432}
433
434void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
435{
436	mutex_init(&mgr->lock);
437	idr_init(&mgr->ctx_handles);
438}
439
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
440void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
441{
442	struct amdgpu_ctx *ctx;
443	struct idr *idp;
444	uint32_t id;
445
 
 
446	idp = &mgr->ctx_handles;
447
448	idr_for_each_entry(idp, ctx, id) {
449		if (kref_put(&ctx->refcount, amdgpu_ctx_do_release) != 1)
450			DRM_ERROR("ctx %p is still alive\n", ctx);
451	}
452
453	idr_destroy(&mgr->ctx_handles);
454	mutex_destroy(&mgr->lock);
455}