Loading...
1/*
2 * Copyright (C) 2013 Red Hat
3 * Author: Rob Clark <robdclark@gmail.com>
4 *
5 * This program is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 as published by
7 * the Free Software Foundation.
8 *
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
12 * more details.
13 *
14 * You should have received a copy of the GNU General Public License along with
15 * this program. If not, see <http://www.gnu.org/licenses/>.
16 */
17
18#include <linux/spinlock.h>
19#include <linux/shmem_fs.h>
20#include <linux/dma-buf.h>
21#include <linux/pfn_t.h>
22
23#include "msm_drv.h"
24#include "msm_gem.h"
25#include "msm_gpu.h"
26#include "msm_mmu.h"
27
28static dma_addr_t physaddr(struct drm_gem_object *obj)
29{
30 struct msm_gem_object *msm_obj = to_msm_bo(obj);
31 struct msm_drm_private *priv = obj->dev->dev_private;
32 return (((dma_addr_t)msm_obj->vram_node->start) << PAGE_SHIFT) +
33 priv->vram.paddr;
34}
35
36static bool use_pages(struct drm_gem_object *obj)
37{
38 struct msm_gem_object *msm_obj = to_msm_bo(obj);
39 return !msm_obj->vram_node;
40}
41
42/* allocate pages from VRAM carveout, used when no IOMMU: */
43static struct page **get_pages_vram(struct drm_gem_object *obj,
44 int npages)
45{
46 struct msm_gem_object *msm_obj = to_msm_bo(obj);
47 struct msm_drm_private *priv = obj->dev->dev_private;
48 dma_addr_t paddr;
49 struct page **p;
50 int ret, i;
51
52 p = drm_malloc_ab(npages, sizeof(struct page *));
53 if (!p)
54 return ERR_PTR(-ENOMEM);
55
56 ret = drm_mm_insert_node(&priv->vram.mm, msm_obj->vram_node,
57 npages, 0, DRM_MM_SEARCH_DEFAULT);
58 if (ret) {
59 drm_free_large(p);
60 return ERR_PTR(ret);
61 }
62
63 paddr = physaddr(obj);
64 for (i = 0; i < npages; i++) {
65 p[i] = phys_to_page(paddr);
66 paddr += PAGE_SIZE;
67 }
68
69 return p;
70}
71
72/* called with dev->struct_mutex held */
73static struct page **get_pages(struct drm_gem_object *obj)
74{
75 struct msm_gem_object *msm_obj = to_msm_bo(obj);
76
77 if (!msm_obj->pages) {
78 struct drm_device *dev = obj->dev;
79 struct page **p;
80 int npages = obj->size >> PAGE_SHIFT;
81
82 if (use_pages(obj))
83 p = drm_gem_get_pages(obj);
84 else
85 p = get_pages_vram(obj, npages);
86
87 if (IS_ERR(p)) {
88 dev_err(dev->dev, "could not get pages: %ld\n",
89 PTR_ERR(p));
90 return p;
91 }
92
93 msm_obj->sgt = drm_prime_pages_to_sg(p, npages);
94 if (IS_ERR(msm_obj->sgt)) {
95 dev_err(dev->dev, "failed to allocate sgt\n");
96 return ERR_CAST(msm_obj->sgt);
97 }
98
99 msm_obj->pages = p;
100
101 /* For non-cached buffers, ensure the new pages are clean
102 * because display controller, GPU, etc. are not coherent:
103 */
104 if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
105 dma_map_sg(dev->dev, msm_obj->sgt->sgl,
106 msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
107 }
108
109 return msm_obj->pages;
110}
111
112static void put_pages(struct drm_gem_object *obj)
113{
114 struct msm_gem_object *msm_obj = to_msm_bo(obj);
115
116 if (msm_obj->pages) {
117 /* For non-cached buffers, ensure the new pages are clean
118 * because display controller, GPU, etc. are not coherent:
119 */
120 if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
121 dma_unmap_sg(obj->dev->dev, msm_obj->sgt->sgl,
122 msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
123 sg_free_table(msm_obj->sgt);
124 kfree(msm_obj->sgt);
125
126 if (use_pages(obj))
127 drm_gem_put_pages(obj, msm_obj->pages, true, false);
128 else {
129 drm_mm_remove_node(msm_obj->vram_node);
130 drm_free_large(msm_obj->pages);
131 }
132
133 msm_obj->pages = NULL;
134 }
135}
136
137struct page **msm_gem_get_pages(struct drm_gem_object *obj)
138{
139 struct drm_device *dev = obj->dev;
140 struct page **p;
141 mutex_lock(&dev->struct_mutex);
142 p = get_pages(obj);
143 mutex_unlock(&dev->struct_mutex);
144 return p;
145}
146
/*
 * Counterpart of msm_gem_get_pages().  Currently a no-op: there is no
 * pin count yet, so there is nothing to release here.
 */
void msm_gem_put_pages(struct drm_gem_object *obj)
{
	/* intentionally empty until pin counting exists */
}
151
152int msm_gem_mmap_obj(struct drm_gem_object *obj,
153 struct vm_area_struct *vma)
154{
155 struct msm_gem_object *msm_obj = to_msm_bo(obj);
156
157 vma->vm_flags &= ~VM_PFNMAP;
158 vma->vm_flags |= VM_MIXEDMAP;
159
160 if (msm_obj->flags & MSM_BO_WC) {
161 vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
162 } else if (msm_obj->flags & MSM_BO_UNCACHED) {
163 vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags));
164 } else {
165 /*
166 * Shunt off cached objs to shmem file so they have their own
167 * address_space (so unmap_mapping_range does what we want,
168 * in particular in the case of mmap'd dmabufs)
169 */
170 fput(vma->vm_file);
171 get_file(obj->filp);
172 vma->vm_pgoff = 0;
173 vma->vm_file = obj->filp;
174
175 vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
176 }
177
178 return 0;
179}
180
181int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma)
182{
183 int ret;
184
185 ret = drm_gem_mmap(filp, vma);
186 if (ret) {
187 DBG("mmap failed: %d", ret);
188 return ret;
189 }
190
191 return msm_gem_mmap_obj(vma->vm_private_data, vma);
192}
193
194int msm_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
195{
196 struct drm_gem_object *obj = vma->vm_private_data;
197 struct drm_device *dev = obj->dev;
198 struct page **pages;
199 unsigned long pfn;
200 pgoff_t pgoff;
201 int ret;
202
203 /* Make sure we don't parallel update on a fault, nor move or remove
204 * something from beneath our feet
205 */
206 ret = mutex_lock_interruptible(&dev->struct_mutex);
207 if (ret)
208 goto out;
209
210 /* make sure we have pages attached now */
211 pages = get_pages(obj);
212 if (IS_ERR(pages)) {
213 ret = PTR_ERR(pages);
214 goto out_unlock;
215 }
216
217 /* We don't use vmf->pgoff since that has the fake offset: */
218 pgoff = ((unsigned long)vmf->virtual_address -
219 vma->vm_start) >> PAGE_SHIFT;
220
221 pfn = page_to_pfn(pages[pgoff]);
222
223 VERB("Inserting %p pfn %lx, pa %lx", vmf->virtual_address,
224 pfn, pfn << PAGE_SHIFT);
225
226 ret = vm_insert_mixed(vma, (unsigned long)vmf->virtual_address,
227 __pfn_to_pfn_t(pfn, PFN_DEV));
228
229out_unlock:
230 mutex_unlock(&dev->struct_mutex);
231out:
232 switch (ret) {
233 case -EAGAIN:
234 case 0:
235 case -ERESTARTSYS:
236 case -EINTR:
237 case -EBUSY:
238 /*
239 * EBUSY is ok: this just means that another thread
240 * already did the job.
241 */
242 return VM_FAULT_NOPAGE;
243 case -ENOMEM:
244 return VM_FAULT_OOM;
245 default:
246 return VM_FAULT_SIGBUS;
247 }
248}
249
250/** get mmap offset */
251static uint64_t mmap_offset(struct drm_gem_object *obj)
252{
253 struct drm_device *dev = obj->dev;
254 int ret;
255
256 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
257
258 /* Make it mmapable */
259 ret = drm_gem_create_mmap_offset(obj);
260
261 if (ret) {
262 dev_err(dev->dev, "could not allocate mmap offset\n");
263 return 0;
264 }
265
266 return drm_vma_node_offset_addr(&obj->vma_node);
267}
268
269uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj)
270{
271 uint64_t offset;
272 mutex_lock(&obj->dev->struct_mutex);
273 offset = mmap_offset(obj);
274 mutex_unlock(&obj->dev->struct_mutex);
275 return offset;
276}
277
278/* should be called under struct_mutex.. although it can be called
279 * from atomic context without struct_mutex to acquire an extra
280 * iova ref if you know one is already held.
281 *
282 * That means when I do eventually need to add support for unpinning
283 * the refcnt counter needs to be atomic_t.
284 */
285int msm_gem_get_iova_locked(struct drm_gem_object *obj, int id,
286 uint32_t *iova)
287{
288 struct msm_gem_object *msm_obj = to_msm_bo(obj);
289 int ret = 0;
290
291 if (!msm_obj->domain[id].iova) {
292 struct msm_drm_private *priv = obj->dev->dev_private;
293 struct page **pages = get_pages(obj);
294
295 if (IS_ERR(pages))
296 return PTR_ERR(pages);
297
298 if (iommu_present(&platform_bus_type)) {
299 struct msm_mmu *mmu = priv->mmus[id];
300 uint32_t offset;
301
302 if (WARN_ON(!mmu))
303 return -EINVAL;
304
305 offset = (uint32_t)mmap_offset(obj);
306 ret = mmu->funcs->map(mmu, offset, msm_obj->sgt,
307 obj->size, IOMMU_READ | IOMMU_WRITE);
308 msm_obj->domain[id].iova = offset;
309 } else {
310 msm_obj->domain[id].iova = physaddr(obj);
311 }
312 }
313
314 if (!ret)
315 *iova = msm_obj->domain[id].iova;
316
317 return ret;
318}
319
320/* get iova, taking a reference. Should have a matching put */
321int msm_gem_get_iova(struct drm_gem_object *obj, int id, uint32_t *iova)
322{
323 struct msm_gem_object *msm_obj = to_msm_bo(obj);
324 int ret;
325
326 /* this is safe right now because we don't unmap until the
327 * bo is deleted:
328 */
329 if (msm_obj->domain[id].iova) {
330 *iova = msm_obj->domain[id].iova;
331 return 0;
332 }
333
334 mutex_lock(&obj->dev->struct_mutex);
335 ret = msm_gem_get_iova_locked(obj, id, iova);
336 mutex_unlock(&obj->dev->struct_mutex);
337 return ret;
338}
339
340/* get iova without taking a reference, used in places where you have
341 * already done a 'msm_gem_get_iova()'.
342 */
343uint32_t msm_gem_iova(struct drm_gem_object *obj, int id)
344{
345 struct msm_gem_object *msm_obj = to_msm_bo(obj);
346 WARN_ON(!msm_obj->domain[id].iova);
347 return msm_obj->domain[id].iova;
348}
349
/*
 * Release an iova reference.  Not implemented yet (XXX TODO).
 *
 * NOTE: a _locked() variant is probably unnecessary.  The plan is not to
 * unmap here, but only to mark the mapping as unmappable once the iova
 * refcnt drops to zero; then, if a later _get_iova_locked() fails,
 * mappings that are no longer needed can be torn down.
 */
void msm_gem_put_iova(struct drm_gem_object *obj, int id)
{
}
359
360int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev,
361 struct drm_mode_create_dumb *args)
362{
363 args->pitch = align_pitch(args->width, args->bpp);
364 args->size = PAGE_ALIGN(args->pitch * args->height);
365 return msm_gem_new_handle(dev, file, args->size,
366 MSM_BO_SCANOUT | MSM_BO_WC, &args->handle);
367}
368
369int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev,
370 uint32_t handle, uint64_t *offset)
371{
372 struct drm_gem_object *obj;
373 int ret = 0;
374
375 /* GEM does all our handle to object mapping */
376 obj = drm_gem_object_lookup(dev, file, handle);
377 if (obj == NULL) {
378 ret = -ENOENT;
379 goto fail;
380 }
381
382 *offset = msm_gem_mmap_offset(obj);
383
384 drm_gem_object_unreference_unlocked(obj);
385
386fail:
387 return ret;
388}
389
390void *msm_gem_vaddr_locked(struct drm_gem_object *obj)
391{
392 struct msm_gem_object *msm_obj = to_msm_bo(obj);
393 WARN_ON(!mutex_is_locked(&obj->dev->struct_mutex));
394 if (!msm_obj->vaddr) {
395 struct page **pages = get_pages(obj);
396 if (IS_ERR(pages))
397 return ERR_CAST(pages);
398 msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT,
399 VM_MAP, pgprot_writecombine(PAGE_KERNEL));
400 }
401 return msm_obj->vaddr;
402}
403
404void *msm_gem_vaddr(struct drm_gem_object *obj)
405{
406 void *ret;
407 mutex_lock(&obj->dev->struct_mutex);
408 ret = msm_gem_vaddr_locked(obj);
409 mutex_unlock(&obj->dev->struct_mutex);
410 return ret;
411}
412
413/* setup callback for when bo is no longer busy..
414 * TODO probably want to differentiate read vs write..
415 */
416int msm_gem_queue_inactive_cb(struct drm_gem_object *obj,
417 struct msm_fence_cb *cb)
418{
419 struct msm_gem_object *msm_obj = to_msm_bo(obj);
420 uint32_t fence = msm_gem_fence(msm_obj,
421 MSM_PREP_READ | MSM_PREP_WRITE);
422 return msm_queue_fence_cb(obj->dev, cb, fence);
423}
424
425void msm_gem_move_to_active(struct drm_gem_object *obj,
426 struct msm_gpu *gpu, bool write, uint32_t fence)
427{
428 struct msm_gem_object *msm_obj = to_msm_bo(obj);
429 msm_obj->gpu = gpu;
430 if (write)
431 msm_obj->write_fence = fence;
432 else
433 msm_obj->read_fence = fence;
434 list_del_init(&msm_obj->mm_list);
435 list_add_tail(&msm_obj->mm_list, &gpu->active_list);
436}
437
438void msm_gem_move_to_inactive(struct drm_gem_object *obj)
439{
440 struct drm_device *dev = obj->dev;
441 struct msm_drm_private *priv = dev->dev_private;
442 struct msm_gem_object *msm_obj = to_msm_bo(obj);
443
444 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
445
446 msm_obj->gpu = NULL;
447 msm_obj->read_fence = 0;
448 msm_obj->write_fence = 0;
449 list_del_init(&msm_obj->mm_list);
450 list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
451}
452
453int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op, ktime_t *timeout)
454{
455 struct drm_device *dev = obj->dev;
456 struct msm_gem_object *msm_obj = to_msm_bo(obj);
457 int ret = 0;
458
459 if (is_active(msm_obj)) {
460 uint32_t fence = msm_gem_fence(msm_obj, op);
461
462 if (op & MSM_PREP_NOSYNC)
463 timeout = NULL;
464
465 ret = msm_wait_fence(dev, fence, timeout, true);
466 }
467
468 /* TODO cache maintenance */
469
470 return ret;
471}
472
/*
 * End a CPU access section started with msm_gem_cpu_prep().  Nothing to
 * do yet (cache maintenance is still TODO); always returns 0.
 */
int msm_gem_cpu_fini(struct drm_gem_object *obj)
{
	return 0;
}
478
479#ifdef CONFIG_DEBUG_FS
480void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m)
481{
482 struct drm_device *dev = obj->dev;
483 struct msm_gem_object *msm_obj = to_msm_bo(obj);
484 uint64_t off = drm_vma_node_start(&obj->vma_node);
485
486 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
487 seq_printf(m, "%08x: %c(r=%u,w=%u) %2d (%2d) %08llx %p %zu\n",
488 msm_obj->flags, is_active(msm_obj) ? 'A' : 'I',
489 msm_obj->read_fence, msm_obj->write_fence,
490 obj->name, obj->refcount.refcount.counter,
491 off, msm_obj->vaddr, obj->size);
492}
493
494void msm_gem_describe_objects(struct list_head *list, struct seq_file *m)
495{
496 struct msm_gem_object *msm_obj;
497 int count = 0;
498 size_t size = 0;
499
500 list_for_each_entry(msm_obj, list, mm_list) {
501 struct drm_gem_object *obj = &msm_obj->base;
502 seq_printf(m, " ");
503 msm_gem_describe(obj, m);
504 count++;
505 size += obj->size;
506 }
507
508 seq_printf(m, "Total %d objects, %zu bytes\n", count, size);
509}
510#endif
511
512void msm_gem_free_object(struct drm_gem_object *obj)
513{
514 struct drm_device *dev = obj->dev;
515 struct msm_drm_private *priv = obj->dev->dev_private;
516 struct msm_gem_object *msm_obj = to_msm_bo(obj);
517 int id;
518
519 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
520
521 /* object should not be on active list: */
522 WARN_ON(is_active(msm_obj));
523
524 list_del(&msm_obj->mm_list);
525
526 for (id = 0; id < ARRAY_SIZE(msm_obj->domain); id++) {
527 struct msm_mmu *mmu = priv->mmus[id];
528 if (mmu && msm_obj->domain[id].iova) {
529 uint32_t offset = msm_obj->domain[id].iova;
530 mmu->funcs->unmap(mmu, offset, msm_obj->sgt, obj->size);
531 }
532 }
533
534 if (obj->import_attach) {
535 if (msm_obj->vaddr)
536 dma_buf_vunmap(obj->import_attach->dmabuf, msm_obj->vaddr);
537
538 /* Don't drop the pages for imported dmabuf, as they are not
539 * ours, just free the array we allocated:
540 */
541 if (msm_obj->pages)
542 drm_free_large(msm_obj->pages);
543
544 drm_prime_gem_destroy(obj, msm_obj->sgt);
545 } else {
546 vunmap(msm_obj->vaddr);
547 put_pages(obj);
548 }
549
550 if (msm_obj->resv == &msm_obj->_resv)
551 reservation_object_fini(msm_obj->resv);
552
553 drm_gem_object_release(obj);
554
555 kfree(msm_obj);
556}
557
558/* convenience method to construct a GEM buffer object, and userspace handle */
559int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file,
560 uint32_t size, uint32_t flags, uint32_t *handle)
561{
562 struct drm_gem_object *obj;
563 int ret;
564
565 ret = mutex_lock_interruptible(&dev->struct_mutex);
566 if (ret)
567 return ret;
568
569 obj = msm_gem_new(dev, size, flags);
570
571 mutex_unlock(&dev->struct_mutex);
572
573 if (IS_ERR(obj))
574 return PTR_ERR(obj);
575
576 ret = drm_gem_handle_create(file, obj, handle);
577
578 /* drop reference from allocate - handle holds it now */
579 drm_gem_object_unreference_unlocked(obj);
580
581 return ret;
582}
583
584static int msm_gem_new_impl(struct drm_device *dev,
585 uint32_t size, uint32_t flags,
586 struct drm_gem_object **obj)
587{
588 struct msm_drm_private *priv = dev->dev_private;
589 struct msm_gem_object *msm_obj;
590 unsigned sz;
591 bool use_vram = false;
592
593 switch (flags & MSM_BO_CACHE_MASK) {
594 case MSM_BO_UNCACHED:
595 case MSM_BO_CACHED:
596 case MSM_BO_WC:
597 break;
598 default:
599 dev_err(dev->dev, "invalid cache flag: %x\n",
600 (flags & MSM_BO_CACHE_MASK));
601 return -EINVAL;
602 }
603
604 if (!iommu_present(&platform_bus_type))
605 use_vram = true;
606 else if ((flags & MSM_BO_STOLEN) && priv->vram.size)
607 use_vram = true;
608
609 if (WARN_ON(use_vram && !priv->vram.size))
610 return -EINVAL;
611
612 sz = sizeof(*msm_obj);
613 if (use_vram)
614 sz += sizeof(struct drm_mm_node);
615
616 msm_obj = kzalloc(sz, GFP_KERNEL);
617 if (!msm_obj)
618 return -ENOMEM;
619
620 if (use_vram)
621 msm_obj->vram_node = (void *)&msm_obj[1];
622
623 msm_obj->flags = flags;
624
625 msm_obj->resv = &msm_obj->_resv;
626 reservation_object_init(msm_obj->resv);
627
628 INIT_LIST_HEAD(&msm_obj->submit_entry);
629 list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
630
631 *obj = &msm_obj->base;
632
633 return 0;
634}
635
636struct drm_gem_object *msm_gem_new(struct drm_device *dev,
637 uint32_t size, uint32_t flags)
638{
639 struct drm_gem_object *obj = NULL;
640 int ret;
641
642 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
643
644 size = PAGE_ALIGN(size);
645
646 ret = msm_gem_new_impl(dev, size, flags, &obj);
647 if (ret)
648 goto fail;
649
650 if (use_pages(obj)) {
651 ret = drm_gem_object_init(dev, obj, size);
652 if (ret)
653 goto fail;
654 } else {
655 drm_gem_private_object_init(dev, obj, size);
656 }
657
658 return obj;
659
660fail:
661 if (obj)
662 drm_gem_object_unreference(obj);
663
664 return ERR_PTR(ret);
665}
666
667struct drm_gem_object *msm_gem_import(struct drm_device *dev,
668 uint32_t size, struct sg_table *sgt)
669{
670 struct msm_gem_object *msm_obj;
671 struct drm_gem_object *obj;
672 int ret, npages;
673
674 /* if we don't have IOMMU, don't bother pretending we can import: */
675 if (!iommu_present(&platform_bus_type)) {
676 dev_err(dev->dev, "cannot import without IOMMU\n");
677 return ERR_PTR(-EINVAL);
678 }
679
680 size = PAGE_ALIGN(size);
681
682 ret = msm_gem_new_impl(dev, size, MSM_BO_WC, &obj);
683 if (ret)
684 goto fail;
685
686 drm_gem_private_object_init(dev, obj, size);
687
688 npages = size / PAGE_SIZE;
689
690 msm_obj = to_msm_bo(obj);
691 msm_obj->sgt = sgt;
692 msm_obj->pages = drm_malloc_ab(npages, sizeof(struct page *));
693 if (!msm_obj->pages) {
694 ret = -ENOMEM;
695 goto fail;
696 }
697
698 ret = drm_prime_sg_to_page_addr_arrays(sgt, msm_obj->pages, NULL, npages);
699 if (ret)
700 goto fail;
701
702 return obj;
703
704fail:
705 if (obj)
706 drm_gem_object_unreference_unlocked(obj);
707
708 return ERR_PTR(ret);
709}
1/*
2 * Copyright (C) 2013 Red Hat
3 * Author: Rob Clark <robdclark@gmail.com>
4 *
5 * This program is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 as published by
7 * the Free Software Foundation.
8 *
9 * This program is distributed in the hope that it will be useful, but WITHOUT
10 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
11 * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
12 * more details.
13 *
14 * You should have received a copy of the GNU General Public License along with
15 * this program. If not, see <http://www.gnu.org/licenses/>.
16 */
17
18#include <linux/spinlock.h>
19#include <linux/shmem_fs.h>
20#include <linux/dma-buf.h>
21
22#include "msm_drv.h"
23#include "msm_gem.h"
24#include "msm_gpu.h"
25#include "msm_mmu.h"
26
27static dma_addr_t physaddr(struct drm_gem_object *obj)
28{
29 struct msm_gem_object *msm_obj = to_msm_bo(obj);
30 struct msm_drm_private *priv = obj->dev->dev_private;
31 return (((dma_addr_t)msm_obj->vram_node->start) << PAGE_SHIFT) +
32 priv->vram.paddr;
33}
34
35/* allocate pages from VRAM carveout, used when no IOMMU: */
36static struct page **get_pages_vram(struct drm_gem_object *obj,
37 int npages)
38{
39 struct msm_gem_object *msm_obj = to_msm_bo(obj);
40 struct msm_drm_private *priv = obj->dev->dev_private;
41 dma_addr_t paddr;
42 struct page **p;
43 int ret, i;
44
45 p = drm_malloc_ab(npages, sizeof(struct page *));
46 if (!p)
47 return ERR_PTR(-ENOMEM);
48
49 ret = drm_mm_insert_node(&priv->vram.mm, msm_obj->vram_node,
50 npages, 0, DRM_MM_SEARCH_DEFAULT);
51 if (ret) {
52 drm_free_large(p);
53 return ERR_PTR(ret);
54 }
55
56 paddr = physaddr(obj);
57 for (i = 0; i < npages; i++) {
58 p[i] = phys_to_page(paddr);
59 paddr += PAGE_SIZE;
60 }
61
62 return p;
63}
64
65/* called with dev->struct_mutex held */
66static struct page **get_pages(struct drm_gem_object *obj)
67{
68 struct msm_gem_object *msm_obj = to_msm_bo(obj);
69
70 if (!msm_obj->pages) {
71 struct drm_device *dev = obj->dev;
72 struct page **p;
73 int npages = obj->size >> PAGE_SHIFT;
74
75 if (iommu_present(&platform_bus_type))
76 p = drm_gem_get_pages(obj, 0);
77 else
78 p = get_pages_vram(obj, npages);
79
80 if (IS_ERR(p)) {
81 dev_err(dev->dev, "could not get pages: %ld\n",
82 PTR_ERR(p));
83 return p;
84 }
85
86 msm_obj->sgt = drm_prime_pages_to_sg(p, npages);
87 if (IS_ERR(msm_obj->sgt)) {
88 dev_err(dev->dev, "failed to allocate sgt\n");
89 return ERR_CAST(msm_obj->sgt);
90 }
91
92 msm_obj->pages = p;
93
94 /* For non-cached buffers, ensure the new pages are clean
95 * because display controller, GPU, etc. are not coherent:
96 */
97 if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
98 dma_map_sg(dev->dev, msm_obj->sgt->sgl,
99 msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
100 }
101
102 return msm_obj->pages;
103}
104
105static void put_pages(struct drm_gem_object *obj)
106{
107 struct msm_gem_object *msm_obj = to_msm_bo(obj);
108
109 if (msm_obj->pages) {
110 /* For non-cached buffers, ensure the new pages are clean
111 * because display controller, GPU, etc. are not coherent:
112 */
113 if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
114 dma_unmap_sg(obj->dev->dev, msm_obj->sgt->sgl,
115 msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
116 sg_free_table(msm_obj->sgt);
117 kfree(msm_obj->sgt);
118
119 if (iommu_present(&platform_bus_type))
120 drm_gem_put_pages(obj, msm_obj->pages, true, false);
121 else {
122 drm_mm_remove_node(msm_obj->vram_node);
123 drm_free_large(msm_obj->pages);
124 }
125
126 msm_obj->pages = NULL;
127 }
128}
129
130struct page **msm_gem_get_pages(struct drm_gem_object *obj)
131{
132 struct drm_device *dev = obj->dev;
133 struct page **p;
134 mutex_lock(&dev->struct_mutex);
135 p = get_pages(obj);
136 mutex_unlock(&dev->struct_mutex);
137 return p;
138}
139
/*
 * Counterpart of msm_gem_get_pages().  Currently a no-op: there is no
 * pin count yet, so there is nothing to release here.
 */
void msm_gem_put_pages(struct drm_gem_object *obj)
{
	/* intentionally empty until pin counting exists */
}
144
145int msm_gem_mmap_obj(struct drm_gem_object *obj,
146 struct vm_area_struct *vma)
147{
148 struct msm_gem_object *msm_obj = to_msm_bo(obj);
149
150 vma->vm_flags &= ~VM_PFNMAP;
151 vma->vm_flags |= VM_MIXEDMAP;
152
153 if (msm_obj->flags & MSM_BO_WC) {
154 vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
155 } else if (msm_obj->flags & MSM_BO_UNCACHED) {
156 vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags));
157 } else {
158 /*
159 * Shunt off cached objs to shmem file so they have their own
160 * address_space (so unmap_mapping_range does what we want,
161 * in particular in the case of mmap'd dmabufs)
162 */
163 fput(vma->vm_file);
164 get_file(obj->filp);
165 vma->vm_pgoff = 0;
166 vma->vm_file = obj->filp;
167
168 vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
169 }
170
171 return 0;
172}
173
174int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma)
175{
176 int ret;
177
178 ret = drm_gem_mmap(filp, vma);
179 if (ret) {
180 DBG("mmap failed: %d", ret);
181 return ret;
182 }
183
184 return msm_gem_mmap_obj(vma->vm_private_data, vma);
185}
186
187int msm_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
188{
189 struct drm_gem_object *obj = vma->vm_private_data;
190 struct drm_device *dev = obj->dev;
191 struct page **pages;
192 unsigned long pfn;
193 pgoff_t pgoff;
194 int ret;
195
196 /* Make sure we don't parallel update on a fault, nor move or remove
197 * something from beneath our feet
198 */
199 ret = mutex_lock_interruptible(&dev->struct_mutex);
200 if (ret)
201 goto out;
202
203 /* make sure we have pages attached now */
204 pages = get_pages(obj);
205 if (IS_ERR(pages)) {
206 ret = PTR_ERR(pages);
207 goto out_unlock;
208 }
209
210 /* We don't use vmf->pgoff since that has the fake offset: */
211 pgoff = ((unsigned long)vmf->virtual_address -
212 vma->vm_start) >> PAGE_SHIFT;
213
214 pfn = page_to_pfn(pages[pgoff]);
215
216 VERB("Inserting %p pfn %lx, pa %lx", vmf->virtual_address,
217 pfn, pfn << PAGE_SHIFT);
218
219 ret = vm_insert_mixed(vma, (unsigned long)vmf->virtual_address, pfn);
220
221out_unlock:
222 mutex_unlock(&dev->struct_mutex);
223out:
224 switch (ret) {
225 case -EAGAIN:
226 case 0:
227 case -ERESTARTSYS:
228 case -EINTR:
229 case -EBUSY:
230 /*
231 * EBUSY is ok: this just means that another thread
232 * already did the job.
233 */
234 return VM_FAULT_NOPAGE;
235 case -ENOMEM:
236 return VM_FAULT_OOM;
237 default:
238 return VM_FAULT_SIGBUS;
239 }
240}
241
242/** get mmap offset */
243static uint64_t mmap_offset(struct drm_gem_object *obj)
244{
245 struct drm_device *dev = obj->dev;
246 int ret;
247
248 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
249
250 /* Make it mmapable */
251 ret = drm_gem_create_mmap_offset(obj);
252
253 if (ret) {
254 dev_err(dev->dev, "could not allocate mmap offset\n");
255 return 0;
256 }
257
258 return drm_vma_node_offset_addr(&obj->vma_node);
259}
260
261uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj)
262{
263 uint64_t offset;
264 mutex_lock(&obj->dev->struct_mutex);
265 offset = mmap_offset(obj);
266 mutex_unlock(&obj->dev->struct_mutex);
267 return offset;
268}
269
270/* should be called under struct_mutex.. although it can be called
271 * from atomic context without struct_mutex to acquire an extra
272 * iova ref if you know one is already held.
273 *
274 * That means when I do eventually need to add support for unpinning
275 * the refcnt counter needs to be atomic_t.
276 */
277int msm_gem_get_iova_locked(struct drm_gem_object *obj, int id,
278 uint32_t *iova)
279{
280 struct msm_gem_object *msm_obj = to_msm_bo(obj);
281 int ret = 0;
282
283 if (!msm_obj->domain[id].iova) {
284 struct msm_drm_private *priv = obj->dev->dev_private;
285 struct msm_mmu *mmu = priv->mmus[id];
286 struct page **pages = get_pages(obj);
287
288 if (IS_ERR(pages))
289 return PTR_ERR(pages);
290
291 if (iommu_present(&platform_bus_type)) {
292 uint32_t offset = (uint32_t)mmap_offset(obj);
293 ret = mmu->funcs->map(mmu, offset, msm_obj->sgt,
294 obj->size, IOMMU_READ | IOMMU_WRITE);
295 msm_obj->domain[id].iova = offset;
296 } else {
297 msm_obj->domain[id].iova = physaddr(obj);
298 }
299 }
300
301 if (!ret)
302 *iova = msm_obj->domain[id].iova;
303
304 return ret;
305}
306
307int msm_gem_get_iova(struct drm_gem_object *obj, int id, uint32_t *iova)
308{
309 struct msm_gem_object *msm_obj = to_msm_bo(obj);
310 int ret;
311
312 /* this is safe right now because we don't unmap until the
313 * bo is deleted:
314 */
315 if (msm_obj->domain[id].iova) {
316 *iova = msm_obj->domain[id].iova;
317 return 0;
318 }
319
320 mutex_lock(&obj->dev->struct_mutex);
321 ret = msm_gem_get_iova_locked(obj, id, iova);
322 mutex_unlock(&obj->dev->struct_mutex);
323 return ret;
324}
325
/*
 * Release an iova reference.  Not implemented yet (XXX TODO).
 *
 * NOTE: a _locked() variant is probably unnecessary.  The plan is not to
 * unmap here, but only to mark the mapping as unmappable once the iova
 * refcnt drops to zero; then, if a later _get_iova_locked() fails,
 * mappings that are no longer needed can be torn down.
 */
void msm_gem_put_iova(struct drm_gem_object *obj, int id)
{
}
335
336int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev,
337 struct drm_mode_create_dumb *args)
338{
339 args->pitch = align_pitch(args->width, args->bpp);
340 args->size = PAGE_ALIGN(args->pitch * args->height);
341 return msm_gem_new_handle(dev, file, args->size,
342 MSM_BO_SCANOUT | MSM_BO_WC, &args->handle);
343}
344
345int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev,
346 uint32_t handle, uint64_t *offset)
347{
348 struct drm_gem_object *obj;
349 int ret = 0;
350
351 /* GEM does all our handle to object mapping */
352 obj = drm_gem_object_lookup(dev, file, handle);
353 if (obj == NULL) {
354 ret = -ENOENT;
355 goto fail;
356 }
357
358 *offset = msm_gem_mmap_offset(obj);
359
360 drm_gem_object_unreference_unlocked(obj);
361
362fail:
363 return ret;
364}
365
366void *msm_gem_vaddr_locked(struct drm_gem_object *obj)
367{
368 struct msm_gem_object *msm_obj = to_msm_bo(obj);
369 WARN_ON(!mutex_is_locked(&obj->dev->struct_mutex));
370 if (!msm_obj->vaddr) {
371 struct page **pages = get_pages(obj);
372 if (IS_ERR(pages))
373 return ERR_CAST(pages);
374 msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT,
375 VM_MAP, pgprot_writecombine(PAGE_KERNEL));
376 }
377 return msm_obj->vaddr;
378}
379
380void *msm_gem_vaddr(struct drm_gem_object *obj)
381{
382 void *ret;
383 mutex_lock(&obj->dev->struct_mutex);
384 ret = msm_gem_vaddr_locked(obj);
385 mutex_unlock(&obj->dev->struct_mutex);
386 return ret;
387}
388
389/* setup callback for when bo is no longer busy..
390 * TODO probably want to differentiate read vs write..
391 */
392int msm_gem_queue_inactive_cb(struct drm_gem_object *obj,
393 struct msm_fence_cb *cb)
394{
395 struct drm_device *dev = obj->dev;
396 struct msm_drm_private *priv = dev->dev_private;
397 struct msm_gem_object *msm_obj = to_msm_bo(obj);
398 int ret = 0;
399
400 mutex_lock(&dev->struct_mutex);
401 if (!list_empty(&cb->work.entry)) {
402 ret = -EINVAL;
403 } else if (is_active(msm_obj)) {
404 cb->fence = max(msm_obj->read_fence, msm_obj->write_fence);
405 list_add_tail(&cb->work.entry, &priv->fence_cbs);
406 } else {
407 queue_work(priv->wq, &cb->work);
408 }
409 mutex_unlock(&dev->struct_mutex);
410
411 return ret;
412}
413
414void msm_gem_move_to_active(struct drm_gem_object *obj,
415 struct msm_gpu *gpu, bool write, uint32_t fence)
416{
417 struct msm_gem_object *msm_obj = to_msm_bo(obj);
418 msm_obj->gpu = gpu;
419 if (write)
420 msm_obj->write_fence = fence;
421 else
422 msm_obj->read_fence = fence;
423 list_del_init(&msm_obj->mm_list);
424 list_add_tail(&msm_obj->mm_list, &gpu->active_list);
425}
426
427void msm_gem_move_to_inactive(struct drm_gem_object *obj)
428{
429 struct drm_device *dev = obj->dev;
430 struct msm_drm_private *priv = dev->dev_private;
431 struct msm_gem_object *msm_obj = to_msm_bo(obj);
432
433 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
434
435 msm_obj->gpu = NULL;
436 msm_obj->read_fence = 0;
437 msm_obj->write_fence = 0;
438 list_del_init(&msm_obj->mm_list);
439 list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
440}
441
442int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op,
443 struct timespec *timeout)
444{
445 struct drm_device *dev = obj->dev;
446 struct msm_gem_object *msm_obj = to_msm_bo(obj);
447 int ret = 0;
448
449 if (is_active(msm_obj)) {
450 uint32_t fence = 0;
451
452 if (op & MSM_PREP_READ)
453 fence = msm_obj->write_fence;
454 if (op & MSM_PREP_WRITE)
455 fence = max(fence, msm_obj->read_fence);
456 if (op & MSM_PREP_NOSYNC)
457 timeout = NULL;
458
459 ret = msm_wait_fence_interruptable(dev, fence, timeout);
460 }
461
462 /* TODO cache maintenance */
463
464 return ret;
465}
466
/*
 * End a CPU access section started with msm_gem_cpu_prep().  Nothing to
 * do yet (cache maintenance is still TODO); always returns 0.
 */
int msm_gem_cpu_fini(struct drm_gem_object *obj)
{
	return 0;
}
472
473#ifdef CONFIG_DEBUG_FS
474void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m)
475{
476 struct drm_device *dev = obj->dev;
477 struct msm_gem_object *msm_obj = to_msm_bo(obj);
478 uint64_t off = drm_vma_node_start(&obj->vma_node);
479
480 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
481 seq_printf(m, "%08x: %c(r=%u,w=%u) %2d (%2d) %08llx %p %d\n",
482 msm_obj->flags, is_active(msm_obj) ? 'A' : 'I',
483 msm_obj->read_fence, msm_obj->write_fence,
484 obj->name, obj->refcount.refcount.counter,
485 off, msm_obj->vaddr, obj->size);
486}
487
488void msm_gem_describe_objects(struct list_head *list, struct seq_file *m)
489{
490 struct msm_gem_object *msm_obj;
491 int count = 0;
492 size_t size = 0;
493
494 list_for_each_entry(msm_obj, list, mm_list) {
495 struct drm_gem_object *obj = &msm_obj->base;
496 seq_printf(m, " ");
497 msm_gem_describe(obj, m);
498 count++;
499 size += obj->size;
500 }
501
502 seq_printf(m, "Total %d objects, %zu bytes\n", count, size);
503}
504#endif
505
506void msm_gem_free_object(struct drm_gem_object *obj)
507{
508 struct drm_device *dev = obj->dev;
509 struct msm_drm_private *priv = obj->dev->dev_private;
510 struct msm_gem_object *msm_obj = to_msm_bo(obj);
511 int id;
512
513 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
514
515 /* object should not be on active list: */
516 WARN_ON(is_active(msm_obj));
517
518 list_del(&msm_obj->mm_list);
519
520 for (id = 0; id < ARRAY_SIZE(msm_obj->domain); id++) {
521 struct msm_mmu *mmu = priv->mmus[id];
522 if (mmu && msm_obj->domain[id].iova) {
523 uint32_t offset = (uint32_t)mmap_offset(obj);
524 mmu->funcs->unmap(mmu, offset, msm_obj->sgt, obj->size);
525 }
526 }
527
528 drm_gem_free_mmap_offset(obj);
529
530 if (obj->import_attach) {
531 if (msm_obj->vaddr)
532 dma_buf_vunmap(obj->import_attach->dmabuf, msm_obj->vaddr);
533
534 /* Don't drop the pages for imported dmabuf, as they are not
535 * ours, just free the array we allocated:
536 */
537 if (msm_obj->pages)
538 drm_free_large(msm_obj->pages);
539
540 } else {
541 if (msm_obj->vaddr)
542 vunmap(msm_obj->vaddr);
543 put_pages(obj);
544 }
545
546 if (msm_obj->resv == &msm_obj->_resv)
547 reservation_object_fini(msm_obj->resv);
548
549 drm_gem_object_release(obj);
550
551 kfree(msm_obj);
552}
553
554/* convenience method to construct a GEM buffer object, and userspace handle */
555int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file,
556 uint32_t size, uint32_t flags, uint32_t *handle)
557{
558 struct drm_gem_object *obj;
559 int ret;
560
561 ret = mutex_lock_interruptible(&dev->struct_mutex);
562 if (ret)
563 return ret;
564
565 obj = msm_gem_new(dev, size, flags);
566
567 mutex_unlock(&dev->struct_mutex);
568
569 if (IS_ERR(obj))
570 return PTR_ERR(obj);
571
572 ret = drm_gem_handle_create(file, obj, handle);
573
574 /* drop reference from allocate - handle holds it now */
575 drm_gem_object_unreference_unlocked(obj);
576
577 return ret;
578}
579
580static int msm_gem_new_impl(struct drm_device *dev,
581 uint32_t size, uint32_t flags,
582 struct drm_gem_object **obj)
583{
584 struct msm_drm_private *priv = dev->dev_private;
585 struct msm_gem_object *msm_obj;
586 unsigned sz;
587
588 switch (flags & MSM_BO_CACHE_MASK) {
589 case MSM_BO_UNCACHED:
590 case MSM_BO_CACHED:
591 case MSM_BO_WC:
592 break;
593 default:
594 dev_err(dev->dev, "invalid cache flag: %x\n",
595 (flags & MSM_BO_CACHE_MASK));
596 return -EINVAL;
597 }
598
599 sz = sizeof(*msm_obj);
600 if (!iommu_present(&platform_bus_type))
601 sz += sizeof(struct drm_mm_node);
602
603 msm_obj = kzalloc(sz, GFP_KERNEL);
604 if (!msm_obj)
605 return -ENOMEM;
606
607 if (!iommu_present(&platform_bus_type))
608 msm_obj->vram_node = (void *)&msm_obj[1];
609
610 msm_obj->flags = flags;
611
612 msm_obj->resv = &msm_obj->_resv;
613 reservation_object_init(msm_obj->resv);
614
615 INIT_LIST_HEAD(&msm_obj->submit_entry);
616 list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
617
618 *obj = &msm_obj->base;
619
620 return 0;
621}
622
623struct drm_gem_object *msm_gem_new(struct drm_device *dev,
624 uint32_t size, uint32_t flags)
625{
626 struct drm_gem_object *obj = NULL;
627 int ret;
628
629 WARN_ON(!mutex_is_locked(&dev->struct_mutex));
630
631 size = PAGE_ALIGN(size);
632
633 ret = msm_gem_new_impl(dev, size, flags, &obj);
634 if (ret)
635 goto fail;
636
637 if (iommu_present(&platform_bus_type)) {
638 ret = drm_gem_object_init(dev, obj, size);
639 if (ret)
640 goto fail;
641 } else {
642 drm_gem_private_object_init(dev, obj, size);
643 }
644
645 return obj;
646
647fail:
648 if (obj)
649 drm_gem_object_unreference(obj);
650
651 return ERR_PTR(ret);
652}
653
654struct drm_gem_object *msm_gem_import(struct drm_device *dev,
655 uint32_t size, struct sg_table *sgt)
656{
657 struct msm_gem_object *msm_obj;
658 struct drm_gem_object *obj;
659 int ret, npages;
660
661 /* if we don't have IOMMU, don't bother pretending we can import: */
662 if (!iommu_present(&platform_bus_type)) {
663 dev_err(dev->dev, "cannot import without IOMMU\n");
664 return ERR_PTR(-EINVAL);
665 }
666
667 size = PAGE_ALIGN(size);
668
669 ret = msm_gem_new_impl(dev, size, MSM_BO_WC, &obj);
670 if (ret)
671 goto fail;
672
673 drm_gem_private_object_init(dev, obj, size);
674
675 npages = size / PAGE_SIZE;
676
677 msm_obj = to_msm_bo(obj);
678 msm_obj->sgt = sgt;
679 msm_obj->pages = drm_malloc_ab(npages, sizeof(struct page *));
680 if (!msm_obj->pages) {
681 ret = -ENOMEM;
682 goto fail;
683 }
684
685 ret = drm_prime_sg_to_page_addr_arrays(sgt, msm_obj->pages, NULL, npages);
686 if (ret)
687 goto fail;
688
689 return obj;
690
691fail:
692 if (obj)
693 drm_gem_object_unreference_unlocked(obj);
694
695 return ERR_PTR(ret);
696}