amdgpu_ctx.c - drivers/gpu/drm/amd/amdgpu/amdgpu_ctx.c - Linux diff v5.9

  1/*
  2 * Copyright 2015 Advanced Micro Devices, Inc.
  3 *
  4 * Permission is hereby granted, free of charge, to any person obtaining a
  5 * copy of this software and associated documentation files (the "Software"),
  6 * to deal in the Software without restriction, including without limitation
  7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8 * and/or sell copies of the Software, and to permit persons to whom the
  9 * Software is furnished to do so, subject to the following conditions:
 10 *
 11 * The above copyright notice and this permission notice shall be included in
 12 * all copies or substantial portions of the Software.
 13 *
 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 20 * OTHER DEALINGS IN THE SOFTWARE.
 21 *
 22 * Authors: monk liu <monk.liu@amd.com>
 23 */
 24
 25#include <drm/drm_auth.h>
 26#include "amdgpu.h"
 27#include "amdgpu_sched.h"
 28#include "amdgpu_ras.h"
 29#include <linux/nospec.h>
 30
 31#define to_amdgpu_ctx_entity(e)	\
 32	container_of((e), struct amdgpu_ctx_entity, entity)
 33
 34const unsigned int amdgpu_ctx_num_entities[AMDGPU_HW_IP_NUM] = {
 35	[AMDGPU_HW_IP_GFX]	=	1,
 36	[AMDGPU_HW_IP_COMPUTE]	=	4,
 37	[AMDGPU_HW_IP_DMA]	=	2,
 38	[AMDGPU_HW_IP_UVD]	=	1,
 39	[AMDGPU_HW_IP_VCE]	=	1,
 40	[AMDGPU_HW_IP_UVD_ENC]	=	1,
 41	[AMDGPU_HW_IP_VCN_DEC]	=	1,
 42	[AMDGPU_HW_IP_VCN_ENC]	=	1,
 43	[AMDGPU_HW_IP_VCN_JPEG]	=	1,
 44};
 45
 46static int amdgpu_ctx_priority_permit(struct drm_file *filp,
 47				      enum drm_sched_priority priority)
 48{
 49	if (priority < 0 || priority >= DRM_SCHED_PRIORITY_MAX)
 50		return -EINVAL;
 51
 52	/* NORMAL and below are accessible by everyone */
 53	if (priority <= DRM_SCHED_PRIORITY_NORMAL)
 54		return 0;
 55
 56	if (capable(CAP_SYS_NICE))
 57		return 0;
 58
 59	if (drm_is_current_master(filp))
 60		return 0;
 61
 62	return -EACCES;
 63}
 64
 65static enum gfx_pipe_priority amdgpu_ctx_sched_prio_to_compute_prio(enum drm_sched_priority prio)
 66{
 67	switch (prio) {
 68	case DRM_SCHED_PRIORITY_HIGH_HW:
 69	case DRM_SCHED_PRIORITY_KERNEL:
 70		return AMDGPU_GFX_PIPE_PRIO_HIGH;
 71	default:
 72		return AMDGPU_GFX_PIPE_PRIO_NORMAL;
 73	}
 74}
 75
 76static unsigned int amdgpu_ctx_prio_sched_to_hw(struct amdgpu_device *adev,
 77						 enum drm_sched_priority prio,
 78						 u32 hw_ip)
 79{
 80	unsigned int hw_prio;
 81
 82	hw_prio = (hw_ip == AMDGPU_HW_IP_COMPUTE) ?
 83			amdgpu_ctx_sched_prio_to_compute_prio(prio) :
 84			AMDGPU_RING_PRIO_DEFAULT;
 85	hw_ip = array_index_nospec(hw_ip, AMDGPU_HW_IP_NUM);
 86	if (adev->gpu_sched[hw_ip][hw_prio].num_scheds == 0)
 87		hw_prio = AMDGPU_RING_PRIO_DEFAULT;
 88
 89	return hw_prio;
 90}
 91
 92static int amdgpu_ctx_init_entity(struct amdgpu_ctx *ctx, u32 hw_ip,
 93				   const u32 ring)
 94{
 95	struct amdgpu_device *adev = ctx->adev;
 96	struct amdgpu_ctx_entity *entity;
 97	struct drm_gpu_scheduler **scheds = NULL, *sched = NULL;
 98	unsigned num_scheds = 0;
 99	unsigned int hw_prio;
100	enum drm_sched_priority priority;
101	int r;
102
103	entity = kcalloc(1, offsetof(typeof(*entity), fences[amdgpu_sched_jobs]),
104			 GFP_KERNEL);
105	if (!entity)
106		return  -ENOMEM;
107
108	entity->sequence = 1;
109	priority = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
110				ctx->init_priority : ctx->override_priority;
111	hw_prio = amdgpu_ctx_prio_sched_to_hw(adev, priority, hw_ip);
112
113	hw_ip = array_index_nospec(hw_ip, AMDGPU_HW_IP_NUM);
114	scheds = adev->gpu_sched[hw_ip][hw_prio].sched;
115	num_scheds = adev->gpu_sched[hw_ip][hw_prio].num_scheds;
116
117	if (hw_ip == AMDGPU_HW_IP_VCN_ENC || hw_ip == AMDGPU_HW_IP_VCN_DEC) {
118		sched = drm_sched_pick_best(scheds, num_scheds);
119		scheds = &sched;
120		num_scheds = 1;
121	}
122
123	r = drm_sched_entity_init(&entity->entity, priority, scheds, num_scheds,
124				  &ctx->guilty);
125	if (r)
126		goto error_free_entity;
127
128	ctx->entities[hw_ip][ring] = entity;
129	return 0;
130
131error_free_entity:
132	kfree(entity);
133
134	return r;
135}
136
137static int amdgpu_ctx_init(struct amdgpu_device *adev,
138			   enum drm_sched_priority priority,
139			   struct drm_file *filp,
140			   struct amdgpu_ctx *ctx)
141{
 
142	int r;
143
144	r = amdgpu_ctx_priority_permit(filp, priority);
145	if (r)
146		return r;
147
148	memset(ctx, 0, sizeof(*ctx));
149
150	ctx->adev = adev;
151
152	kref_init(&ctx->refcount);
153	spin_lock_init(&ctx->ring_lock);
154	mutex_init(&ctx->lock);
 
 
 
155
156	ctx->reset_counter = atomic_read(&adev->gpu_reset_counter);
157	ctx->reset_counter_query = ctx->reset_counter;
158	ctx->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
159	ctx->init_priority = priority;
160	ctx->override_priority = DRM_SCHED_PRIORITY_UNSET;
 
 
 
 
 
 
 
 
 
 
161
 
 
 
 
 
 
 
162	return 0;
163}
164
165static void amdgpu_ctx_fini_entity(struct amdgpu_ctx_entity *entity)
166{
167
168	int i;
169
170	if (!entity)
171		return;
172
173	for (i = 0; i < amdgpu_sched_jobs; ++i)
174		dma_fence_put(entity->fences[i]);
175
176	kfree(entity);
177}
178
179static void amdgpu_ctx_fini(struct kref *ref)
180{
181	struct amdgpu_ctx *ctx = container_of(ref, struct amdgpu_ctx, refcount);
182	struct amdgpu_device *adev = ctx->adev;
183	unsigned i, j;
184
185	if (!adev)
186		return;
187
188	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
189		for (j = 0; j < AMDGPU_MAX_ENTITY_NUM; ++j) {
190			amdgpu_ctx_fini_entity(ctx->entities[i][j]);
191			ctx->entities[i][j] = NULL;
192		}
193	}
194
195	mutex_destroy(&ctx->lock);
196	kfree(ctx);
197}
198
199int amdgpu_ctx_get_entity(struct amdgpu_ctx *ctx, u32 hw_ip, u32 instance,
200			  u32 ring, struct drm_sched_entity **entity)
201{
202	int r;
203
204	if (hw_ip >= AMDGPU_HW_IP_NUM) {
205		DRM_ERROR("unknown HW IP type: %d\n", hw_ip);
206		return -EINVAL;
207	}
208
209	/* Right now all IPs have only one instance - multiple rings. */
210	if (instance != 0) {
211		DRM_DEBUG("invalid ip instance: %d\n", instance);
212		return -EINVAL;
213	}
214
215	if (ring >= amdgpu_ctx_num_entities[hw_ip]) {
216		DRM_DEBUG("invalid ring: %d %d\n", hw_ip, ring);
217		return -EINVAL;
218	}
219
220	if (ctx->entities[hw_ip][ring] == NULL) {
221		r = amdgpu_ctx_init_entity(ctx, hw_ip, ring);
222		if (r)
223			return r;
224	}
225
226	*entity = &ctx->entities[hw_ip][ring]->entity;
227	return 0;
228}
229
230static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
231			    struct amdgpu_fpriv *fpriv,
232			    struct drm_file *filp,
233			    enum drm_sched_priority priority,
234			    uint32_t *id)
235{
236	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
237	struct amdgpu_ctx *ctx;
238	int r;
239
240	ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
241	if (!ctx)
242		return -ENOMEM;
243
244	mutex_lock(&mgr->lock);
245	r = idr_alloc(&mgr->ctx_handles, ctx, 1, AMDGPU_VM_MAX_NUM_CTX, GFP_KERNEL);
246	if (r < 0) {
247		mutex_unlock(&mgr->lock);
248		kfree(ctx);
249		return r;
250	}
251
252	*id = (uint32_t)r;
253	r = amdgpu_ctx_init(adev, priority, filp, ctx);
254	if (r) {
255		idr_remove(&mgr->ctx_handles, *id);
256		*id = 0;
257		kfree(ctx);
258	}
259	mutex_unlock(&mgr->lock);
260	return r;
261}
262
263static void amdgpu_ctx_do_release(struct kref *ref)
264{
265	struct amdgpu_ctx *ctx;
266	u32 i, j;
267
268	ctx = container_of(ref, struct amdgpu_ctx, refcount);
269	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
270		for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
271			if (!ctx->entities[i][j])
272				continue;
273
274			drm_sched_entity_destroy(&ctx->entities[i][j]->entity);
275		}
276	}
277
278	amdgpu_ctx_fini(ref);
279}
280
281static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
282{
283	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
284	struct amdgpu_ctx *ctx;
285
286	mutex_lock(&mgr->lock);
287	ctx = idr_remove(&mgr->ctx_handles, id);
288	if (ctx)
 
289		kref_put(&ctx->refcount, amdgpu_ctx_do_release);
 
 
 
290	mutex_unlock(&mgr->lock);
291	return ctx ? 0 : -EINVAL;
292}
293
294static int amdgpu_ctx_query(struct amdgpu_device *adev,
295			    struct amdgpu_fpriv *fpriv, uint32_t id,
296			    union drm_amdgpu_ctx_out *out)
297{
298	struct amdgpu_ctx *ctx;
299	struct amdgpu_ctx_mgr *mgr;
300	unsigned reset_counter;
301
302	if (!fpriv)
303		return -EINVAL;
304
305	mgr = &fpriv->ctx_mgr;
306	mutex_lock(&mgr->lock);
307	ctx = idr_find(&mgr->ctx_handles, id);
308	if (!ctx) {
309		mutex_unlock(&mgr->lock);
310		return -EINVAL;
311	}
312
313	/* TODO: these two are always zero */
314	out->state.flags = 0x0;
315	out->state.hangs = 0x0;
316
317	/* determine if a GPU reset has occured since the last call */
318	reset_counter = atomic_read(&adev->gpu_reset_counter);
319	/* TODO: this should ideally return NO, GUILTY, or INNOCENT. */
320	if (ctx->reset_counter_query == reset_counter)
321		out->state.reset_status = AMDGPU_CTX_NO_RESET;
322	else
323		out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
324	ctx->reset_counter_query = reset_counter;
325
326	mutex_unlock(&mgr->lock);
327	return 0;
328}
329
330static int amdgpu_ctx_query2(struct amdgpu_device *adev,
331	struct amdgpu_fpriv *fpriv, uint32_t id,
332	union drm_amdgpu_ctx_out *out)
333{
334	struct amdgpu_ctx *ctx;
335	struct amdgpu_ctx_mgr *mgr;
336	unsigned long ras_counter;
337
338	if (!fpriv)
339		return -EINVAL;
340
341	mgr = &fpriv->ctx_mgr;
342	mutex_lock(&mgr->lock);
343	ctx = idr_find(&mgr->ctx_handles, id);
344	if (!ctx) {
345		mutex_unlock(&mgr->lock);
346		return -EINVAL;
347	}
348
349	out->state.flags = 0x0;
350	out->state.hangs = 0x0;
351
352	if (ctx->reset_counter != atomic_read(&adev->gpu_reset_counter))
353		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RESET;
354
355	if (ctx->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
356		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_VRAMLOST;
357
358	if (atomic_read(&ctx->guilty))
359		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_GUILTY;
360
361	/*query ue count*/
362	ras_counter = amdgpu_ras_query_error_count(adev, false);
363	/*ras counter is monotonic increasing*/
364	if (ras_counter != ctx->ras_counter_ue) {
365		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RAS_UE;
366		ctx->ras_counter_ue = ras_counter;
367	}
368
369	/*query ce count*/
370	ras_counter = amdgpu_ras_query_error_count(adev, true);
371	if (ras_counter != ctx->ras_counter_ce) {
372		out->state.flags |= AMDGPU_CTX_QUERY2_FLAGS_RAS_CE;
373		ctx->ras_counter_ce = ras_counter;
374	}
375
376	mutex_unlock(&mgr->lock);
377	return 0;
378}
379
380int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
381		     struct drm_file *filp)
382{
383	int r;
384	uint32_t id;
385	enum drm_sched_priority priority;
386
387	union drm_amdgpu_ctx *args = data;
388	struct amdgpu_device *adev = dev->dev_private;
389	struct amdgpu_fpriv *fpriv = filp->driver_priv;
390
391	r = 0;
392	id = args->in.ctx_id;
393	priority = amdgpu_to_sched_priority(args->in.priority);
394
395	/* For backwards compatibility reasons, we need to accept
396	 * ioctls with garbage in the priority field */
397	if (priority == DRM_SCHED_PRIORITY_INVALID)
398		priority = DRM_SCHED_PRIORITY_NORMAL;
399
400	switch (args->in.op) {
401	case AMDGPU_CTX_OP_ALLOC_CTX:
402		r = amdgpu_ctx_alloc(adev, fpriv, filp, priority, &id);
403		args->out.alloc.ctx_id = id;
404		break;
405	case AMDGPU_CTX_OP_FREE_CTX:
406		r = amdgpu_ctx_free(fpriv, id);
407		break;
408	case AMDGPU_CTX_OP_QUERY_STATE:
409		r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
410		break;
411	case AMDGPU_CTX_OP_QUERY_STATE2:
412		r = amdgpu_ctx_query2(adev, fpriv, id, &args->out);
413		break;
414	default:
415		return -EINVAL;
416	}
417
418	return r;
419}
420
421struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
422{
423	struct amdgpu_ctx *ctx;
424	struct amdgpu_ctx_mgr *mgr;
425
426	if (!fpriv)
427		return NULL;
428
429	mgr = &fpriv->ctx_mgr;
430
431	mutex_lock(&mgr->lock);
432	ctx = idr_find(&mgr->ctx_handles, id);
433	if (ctx)
434		kref_get(&ctx->refcount);
435	mutex_unlock(&mgr->lock);
436	return ctx;
437}
438
439int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
440{
441	if (ctx == NULL)
442		return -EINVAL;
443
444	kref_put(&ctx->refcount, amdgpu_ctx_do_release);
445	return 0;
446}
447
448void amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx,
449			  struct drm_sched_entity *entity,
450			  struct dma_fence *fence, uint64_t* handle)
451{
452	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
453	uint64_t seq = centity->sequence;
454	struct dma_fence *other = NULL;
455	unsigned idx = 0;
 
456
457	idx = seq & (amdgpu_sched_jobs - 1);
458	other = centity->fences[idx];
459	if (other)
460		BUG_ON(!dma_fence_is_signaled(other));
 
 
 
 
461
462	dma_fence_get(fence);
463
464	spin_lock(&ctx->ring_lock);
465	centity->fences[idx] = fence;
466	centity->sequence++;
467	spin_unlock(&ctx->ring_lock);
468
469	dma_fence_put(other);
470	if (handle)
471		*handle = seq;
472}
473
474struct dma_fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
475				       struct drm_sched_entity *entity,
476				       uint64_t seq)
477{
478	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
479	struct dma_fence *fence;
480
481	spin_lock(&ctx->ring_lock);
482
483	if (seq == ~0ull)
484		seq = centity->sequence - 1;
485
486	if (seq >= centity->sequence) {
487		spin_unlock(&ctx->ring_lock);
488		return ERR_PTR(-EINVAL);
489	}
490
491
492	if (seq + amdgpu_sched_jobs < centity->sequence) {
493		spin_unlock(&ctx->ring_lock);
494		return NULL;
495	}
496
497	fence = dma_fence_get(centity->fences[seq & (amdgpu_sched_jobs - 1)]);
498	spin_unlock(&ctx->ring_lock);
499
500	return fence;
501}
502
503static void amdgpu_ctx_set_entity_priority(struct amdgpu_ctx *ctx,
504					    struct amdgpu_ctx_entity *aentity,
505					    int hw_ip,
506					    enum drm_sched_priority priority)
507{
508	struct amdgpu_device *adev = ctx->adev;
509	unsigned int hw_prio;
510	struct drm_gpu_scheduler **scheds = NULL;
511	unsigned num_scheds;
512
513	/* set sw priority */
514	drm_sched_entity_set_priority(&aentity->entity, priority);
515
516	/* set hw priority */
517	if (hw_ip == AMDGPU_HW_IP_COMPUTE) {
518		hw_prio = amdgpu_ctx_prio_sched_to_hw(adev, priority,
519						      AMDGPU_HW_IP_COMPUTE);
520		hw_prio = array_index_nospec(hw_prio, AMDGPU_RING_PRIO_MAX);
521		scheds = adev->gpu_sched[hw_ip][hw_prio].sched;
522		num_scheds = adev->gpu_sched[hw_ip][hw_prio].num_scheds;
523		drm_sched_entity_modify_sched(&aentity->entity, scheds,
524					      num_scheds);
525	}
526}
527
528void amdgpu_ctx_priority_override(struct amdgpu_ctx *ctx,
529				  enum drm_sched_priority priority)
530{
531	enum drm_sched_priority ctx_prio;
532	unsigned i, j;
533
534	ctx->override_priority = priority;
535
536	ctx_prio = (ctx->override_priority == DRM_SCHED_PRIORITY_UNSET) ?
537			ctx->init_priority : ctx->override_priority;
538	for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
539		for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
540			if (!ctx->entities[i][j])
541				continue;
542
543			amdgpu_ctx_set_entity_priority(ctx, ctx->entities[i][j],
544						       i, ctx_prio);
545		}
546	}
547}
548
549int amdgpu_ctx_wait_prev_fence(struct amdgpu_ctx *ctx,
550			       struct drm_sched_entity *entity)
551{
552	struct amdgpu_ctx_entity *centity = to_amdgpu_ctx_entity(entity);
553	struct dma_fence *other;
554	unsigned idx;
555	long r;
556
557	spin_lock(&ctx->ring_lock);
558	idx = centity->sequence & (amdgpu_sched_jobs - 1);
559	other = dma_fence_get(centity->fences[idx]);
560	spin_unlock(&ctx->ring_lock);
561
562	if (!other)
563		return 0;
564
565	r = dma_fence_wait(other, true);
566	if (r < 0 && r != -ERESTARTSYS)
567		DRM_ERROR("Error (%ld) waiting for fence!\n", r);
568
569	dma_fence_put(other);
570	return r;
571}
572
573void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
574{
575	mutex_init(&mgr->lock);
576	idr_init(&mgr->ctx_handles);
577}
578
579long amdgpu_ctx_mgr_entity_flush(struct amdgpu_ctx_mgr *mgr, long timeout)
580{
581	struct amdgpu_ctx *ctx;
582	struct idr *idp;
583	uint32_t id, i, j;
584
585	idp = &mgr->ctx_handles;
586
587	mutex_lock(&mgr->lock);
588	idr_for_each_entry(idp, ctx, id) {
589		for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
590			for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
591				struct drm_sched_entity *entity;
592
593				if (!ctx->entities[i][j])
594					continue;
595
596				entity = &ctx->entities[i][j]->entity;
597				timeout = drm_sched_entity_flush(entity, timeout);
598			}
599		}
600	}
601	mutex_unlock(&mgr->lock);
602	return timeout;
603}
604
605void amdgpu_ctx_mgr_entity_fini(struct amdgpu_ctx_mgr *mgr)
606{
607	struct amdgpu_ctx *ctx;
608	struct idr *idp;
609	uint32_t id, i, j;
610
611	idp = &mgr->ctx_handles;
612
613	idr_for_each_entry(idp, ctx, id) {
614		if (kref_read(&ctx->refcount) != 1) {
615			DRM_ERROR("ctx %p is still alive\n", ctx);
616			continue;
617		}
618
619		for (i = 0; i < AMDGPU_HW_IP_NUM; ++i) {
620			for (j = 0; j < amdgpu_ctx_num_entities[i]; ++j) {
621				struct drm_sched_entity *entity;
622
623				if (!ctx->entities[i][j])
624					continue;
625
626				entity = &ctx->entities[i][j]->entity;
627				drm_sched_entity_fini(entity);
628			}
629		}
630	}
631}
632
633void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
634{
635	struct amdgpu_ctx *ctx;
636	struct idr *idp;
637	uint32_t id;
638
639	amdgpu_ctx_mgr_entity_fini(mgr);
640
641	idp = &mgr->ctx_handles;
642
643	idr_for_each_entry(idp, ctx, id) {
644		if (kref_put(&ctx->refcount, amdgpu_ctx_fini) != 1)
645			DRM_ERROR("ctx %p is still alive\n", ctx);
646	}
647
648	idr_destroy(&mgr->ctx_handles);
649	mutex_destroy(&mgr->lock);
650}

  1/*
  2 * Copyright 2015 Advanced Micro Devices, Inc.
  3 *
  4 * Permission is hereby granted, free of charge, to any person obtaining a
  5 * copy of this software and associated documentation files (the "Software"),
  6 * to deal in the Software without restriction, including without limitation
  7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8 * and/or sell copies of the Software, and to permit persons to whom the
  9 * Software is furnished to do so, subject to the following conditions:
 10 *
 11 * The above copyright notice and this permission notice shall be included in
 12 * all copies or substantial portions of the Software.
 13 *
 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 20 * OTHER DEALINGS IN THE SOFTWARE.
 21 *
 22 * Authors: monk liu <monk.liu@amd.com>
 23 */
 24
 25#include <drm/drmP.h>
 26#include "amdgpu.h"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 27
 28static int amdgpu_ctx_init(struct amdgpu_device *adev, struct amdgpu_ctx *ctx)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 29{
 30	unsigned i, j;
 31	int r;
 32
 
 
 
 
 33	memset(ctx, 0, sizeof(*ctx));
 
 34	ctx->adev = adev;
 
 35	kref_init(&ctx->refcount);
 36	spin_lock_init(&ctx->ring_lock);
 37	ctx->fences = kcalloc(amdgpu_sched_jobs * AMDGPU_MAX_RINGS,
 38			      sizeof(struct fence*), GFP_KERNEL);
 39	if (!ctx->fences)
 40		return -ENOMEM;
 41
 42	for (i = 0; i < AMDGPU_MAX_RINGS; ++i) {
 43		ctx->rings[i].sequence = 1;
 44		ctx->rings[i].fences = &ctx->fences[amdgpu_sched_jobs * i];
 45	}
 46	/* create context entity for each ring */
 47	for (i = 0; i < adev->num_rings; i++) {
 48		struct amdgpu_ring *ring = adev->rings[i];
 49		struct amd_sched_rq *rq;
 50
 51		rq = &ring->sched.sched_rq[AMD_SCHED_PRIORITY_NORMAL];
 52		r = amd_sched_entity_init(&ring->sched, &ctx->rings[i].entity,
 53					  rq, amdgpu_sched_jobs);
 54		if (r)
 55			break;
 56	}
 57
 58	if (i < adev->num_rings) {
 59		for (j = 0; j < i; j++)
 60			amd_sched_entity_fini(&adev->rings[j]->sched,
 61					      &ctx->rings[j].entity);
 62		kfree(ctx->fences);
 63		return r;
 64	}
 65	return 0;
 66}
 67
 68static void amdgpu_ctx_fini(struct amdgpu_ctx *ctx)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 69{
 
 70	struct amdgpu_device *adev = ctx->adev;
 71	unsigned i, j;
 72
 73	if (!adev)
 74		return;
 75
 76	for (i = 0; i < AMDGPU_MAX_RINGS; ++i)
 77		for (j = 0; j < amdgpu_sched_jobs; ++j)
 78			fence_put(ctx->rings[i].fences[j]);
 79	kfree(ctx->fences);
 80
 81	for (i = 0; i < adev->num_rings; i++)
 82		amd_sched_entity_fini(&adev->rings[i]->sched,
 83				      &ctx->rings[i].entity);
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 84}
 85
 86static int amdgpu_ctx_alloc(struct amdgpu_device *adev,
 87			    struct amdgpu_fpriv *fpriv,
 
 
 88			    uint32_t *id)
 89{
 90	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
 91	struct amdgpu_ctx *ctx;
 92	int r;
 93
 94	ctx = kmalloc(sizeof(*ctx), GFP_KERNEL);
 95	if (!ctx)
 96		return -ENOMEM;
 97
 98	mutex_lock(&mgr->lock);
 99	r = idr_alloc(&mgr->ctx_handles, ctx, 1, 0, GFP_KERNEL);
100	if (r < 0) {
101		mutex_unlock(&mgr->lock);
102		kfree(ctx);
103		return r;
104	}
 
105	*id = (uint32_t)r;
106	r = amdgpu_ctx_init(adev, ctx);
107	if (r) {
108		idr_remove(&mgr->ctx_handles, *id);
109		*id = 0;
110		kfree(ctx);
111	}
112	mutex_unlock(&mgr->lock);
113	return r;
114}
115
116static void amdgpu_ctx_do_release(struct kref *ref)
117{
118	struct amdgpu_ctx *ctx;
 
119
120	ctx = container_of(ref, struct amdgpu_ctx, refcount);
 
 
 
 
121
122	amdgpu_ctx_fini(ctx);
 
 
123
124	kfree(ctx);
125}
126
127static int amdgpu_ctx_free(struct amdgpu_fpriv *fpriv, uint32_t id)
128{
129	struct amdgpu_ctx_mgr *mgr = &fpriv->ctx_mgr;
130	struct amdgpu_ctx *ctx;
131
132	mutex_lock(&mgr->lock);
133	ctx = idr_find(&mgr->ctx_handles, id);
134	if (ctx) {
135		idr_remove(&mgr->ctx_handles, id);
136		kref_put(&ctx->refcount, amdgpu_ctx_do_release);
137		mutex_unlock(&mgr->lock);
138		return 0;
139	}
140	mutex_unlock(&mgr->lock);
141	return -EINVAL;
142}
143
144static int amdgpu_ctx_query(struct amdgpu_device *adev,
145			    struct amdgpu_fpriv *fpriv, uint32_t id,
146			    union drm_amdgpu_ctx_out *out)
147{
148	struct amdgpu_ctx *ctx;
149	struct amdgpu_ctx_mgr *mgr;
150	unsigned reset_counter;
151
152	if (!fpriv)
153		return -EINVAL;
154
155	mgr = &fpriv->ctx_mgr;
156	mutex_lock(&mgr->lock);
157	ctx = idr_find(&mgr->ctx_handles, id);
158	if (!ctx) {
159		mutex_unlock(&mgr->lock);
160		return -EINVAL;
161	}
162
163	/* TODO: these two are always zero */
164	out->state.flags = 0x0;
165	out->state.hangs = 0x0;
166
167	/* determine if a GPU reset has occured since the last call */
168	reset_counter = atomic_read(&adev->gpu_reset_counter);
169	/* TODO: this should ideally return NO, GUILTY, or INNOCENT. */
170	if (ctx->reset_counter == reset_counter)
171		out->state.reset_status = AMDGPU_CTX_NO_RESET;
172	else
173		out->state.reset_status = AMDGPU_CTX_UNKNOWN_RESET;
174	ctx->reset_counter = reset_counter;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
175
176	mutex_unlock(&mgr->lock);
177	return 0;
178}
179
180int amdgpu_ctx_ioctl(struct drm_device *dev, void *data,
181		     struct drm_file *filp)
182{
183	int r;
184	uint32_t id;
 
185
186	union drm_amdgpu_ctx *args = data;
187	struct amdgpu_device *adev = dev->dev_private;
188	struct amdgpu_fpriv *fpriv = filp->driver_priv;
189
190	r = 0;
191	id = args->in.ctx_id;
 
 
 
 
 
 
192
193	switch (args->in.op) {
194	case AMDGPU_CTX_OP_ALLOC_CTX:
195		r = amdgpu_ctx_alloc(adev, fpriv, &id);
196		args->out.alloc.ctx_id = id;
197		break;
198	case AMDGPU_CTX_OP_FREE_CTX:
199		r = amdgpu_ctx_free(fpriv, id);
200		break;
201	case AMDGPU_CTX_OP_QUERY_STATE:
202		r = amdgpu_ctx_query(adev, fpriv, id, &args->out);
203		break;
 
 
 
204	default:
205		return -EINVAL;
206	}
207
208	return r;
209}
210
211struct amdgpu_ctx *amdgpu_ctx_get(struct amdgpu_fpriv *fpriv, uint32_t id)
212{
213	struct amdgpu_ctx *ctx;
214	struct amdgpu_ctx_mgr *mgr;
215
216	if (!fpriv)
217		return NULL;
218
219	mgr = &fpriv->ctx_mgr;
220
221	mutex_lock(&mgr->lock);
222	ctx = idr_find(&mgr->ctx_handles, id);
223	if (ctx)
224		kref_get(&ctx->refcount);
225	mutex_unlock(&mgr->lock);
226	return ctx;
227}
228
229int amdgpu_ctx_put(struct amdgpu_ctx *ctx)
230{
231	if (ctx == NULL)
232		return -EINVAL;
233
234	kref_put(&ctx->refcount, amdgpu_ctx_do_release);
235	return 0;
236}
237
238uint64_t amdgpu_ctx_add_fence(struct amdgpu_ctx *ctx, struct amdgpu_ring *ring,
239			      struct fence *fence)
240{
241	struct amdgpu_ctx_ring *cring = & ctx->rings[ring->idx];
242	uint64_t seq = cring->sequence;
 
 
243	unsigned idx = 0;
244	struct fence *other = NULL;
245
246	idx = seq & (amdgpu_sched_jobs - 1);
247	other = cring->fences[idx];
248	if (other) {
249		signed long r;
250		r = fence_wait_timeout(other, false, MAX_SCHEDULE_TIMEOUT);
251		if (r < 0)
252			DRM_ERROR("Error (%ld) waiting for fence!\n", r);
253	}
254
255	fence_get(fence);
256
257	spin_lock(&ctx->ring_lock);
258	cring->fences[idx] = fence;
259	cring->sequence++;
260	spin_unlock(&ctx->ring_lock);
261
262	fence_put(other);
263
264	return seq;
265}
266
267struct fence *amdgpu_ctx_get_fence(struct amdgpu_ctx *ctx,
268				   struct amdgpu_ring *ring, uint64_t seq)
 
269{
270	struct amdgpu_ctx_ring *cring = & ctx->rings[ring->idx];
271	struct fence *fence;
272
273	spin_lock(&ctx->ring_lock);
274
275	if (seq >= cring->sequence) {
 
 
 
276		spin_unlock(&ctx->ring_lock);
277		return ERR_PTR(-EINVAL);
278	}
279
280
281	if (seq + amdgpu_sched_jobs < cring->sequence) {
282		spin_unlock(&ctx->ring_lock);
283		return NULL;
284	}
285
286	fence = fence_get(cring->fences[seq & (amdgpu_sched_jobs - 1)]);
287	spin_unlock(&ctx->ring_lock);
288
289	return fence;
290}
291
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
292void amdgpu_ctx_mgr_init(struct amdgpu_ctx_mgr *mgr)
293{
294	mutex_init(&mgr->lock);
295	idr_init(&mgr->ctx_handles);
296}
297
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
298void amdgpu_ctx_mgr_fini(struct amdgpu_ctx_mgr *mgr)
299{
300	struct amdgpu_ctx *ctx;
301	struct idr *idp;
302	uint32_t id;
303
 
 
304	idp = &mgr->ctx_handles;
305
306	idr_for_each_entry(idp, ctx, id) {
307		if (kref_put(&ctx->refcount, amdgpu_ctx_do_release) != 1)
308			DRM_ERROR("ctx %p is still alive\n", ctx);
309	}
310
311	idr_destroy(&mgr->ctx_handles);
312	mutex_destroy(&mgr->lock);
313}