/*
 * Copyright (C) 2013 Red Hat
 * Author: Rob Clark <robdclark@gmail.com>
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 as published by
 * the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#include <linux/spinlock.h>
#include <linux/shmem_fs.h>
#include <linux/dma-buf.h>

#include "msm_drv.h"
#include "msm_gem.h"
#include "msm_gpu.h"
#include "msm_mmu.h"

static dma_addr_t physaddr(struct drm_gem_object *obj)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        struct msm_drm_private *priv = obj->dev->dev_private;
        return (((dma_addr_t)msm_obj->vram_node->start) << PAGE_SHIFT) +
                        priv->vram.paddr;
}

/* allocate pages from VRAM carveout, used when no IOMMU: */
static struct page **get_pages_vram(struct drm_gem_object *obj,
                int npages)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        struct msm_drm_private *priv = obj->dev->dev_private;
        dma_addr_t paddr;
        struct page **p;
        int ret, i;

        p = drm_malloc_ab(npages, sizeof(struct page *));
        if (!p)
                return ERR_PTR(-ENOMEM);

        ret = drm_mm_insert_node(&priv->vram.mm, msm_obj->vram_node,
                        npages, 0, DRM_MM_SEARCH_DEFAULT);
        if (ret) {
                drm_free_large(p);
                return ERR_PTR(ret);
        }

        paddr = physaddr(obj);
        for (i = 0; i < npages; i++) {
                p[i] = phys_to_page(paddr);
                paddr += PAGE_SIZE;
        }

        return p;
}

/* called with dev->struct_mutex held */
static struct page **get_pages(struct drm_gem_object *obj)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);

        if (!msm_obj->pages) {
                struct drm_device *dev = obj->dev;
                struct page **p;
                int npages = obj->size >> PAGE_SHIFT;

                if (iommu_present(&platform_bus_type))
                        p = drm_gem_get_pages(obj, 0);
                else
                        p = get_pages_vram(obj, npages);

                if (IS_ERR(p)) {
                        dev_err(dev->dev, "could not get pages: %ld\n",
                                        PTR_ERR(p));
                        return p;
                }

                msm_obj->sgt = drm_prime_pages_to_sg(p, npages);
                if (IS_ERR(msm_obj->sgt)) {
                        dev_err(dev->dev, "failed to allocate sgt\n");
                        return ERR_CAST(msm_obj->sgt);
                }

                msm_obj->pages = p;

                /* For non-cached buffers, ensure the new pages are clean
                 * because display controller, GPU, etc. are not coherent:
                 */
                if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
                        dma_map_sg(dev->dev, msm_obj->sgt->sgl,
                                        msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
        }

        return msm_obj->pages;
}

static void put_pages(struct drm_gem_object *obj)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);

        if (msm_obj->pages) {
                /* For non-cached buffers, ensure the new pages are clean
                 * because display controller, GPU, etc. are not coherent:
                 */
                if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
                        dma_unmap_sg(obj->dev->dev, msm_obj->sgt->sgl,
                                        msm_obj->sgt->nents, DMA_BIDIRECTIONAL);
                sg_free_table(msm_obj->sgt);
                kfree(msm_obj->sgt);

                if (iommu_present(&platform_bus_type))
                        drm_gem_put_pages(obj, msm_obj->pages, true, false);
                else {
                        drm_mm_remove_node(msm_obj->vram_node);
                        drm_free_large(msm_obj->pages);
                }

                msm_obj->pages = NULL;
        }
}

struct page **msm_gem_get_pages(struct drm_gem_object *obj)
{
        struct drm_device *dev = obj->dev;
        struct page **p;
        mutex_lock(&dev->struct_mutex);
        p = get_pages(obj);
        mutex_unlock(&dev->struct_mutex);
        return p;
}

void msm_gem_put_pages(struct drm_gem_object *obj)
{
        /* when we start tracking the pin count, then do something here */
}
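
/* Illustrative usage sketch (hypothetical caller, not part of this file):
 * a pin/unpin style path would bracket access to the backing store with
 * these two helpers:
 *
 *      struct page **p = msm_gem_get_pages(obj);
 *      if (IS_ERR(p))
 *              return PTR_ERR(p);
 *      ... access p[] / msm_obj->sgt ...
 *      msm_gem_put_pages(obj);
 */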

int msm_gem_mmap_obj(struct drm_gem_object *obj,
                struct vm_area_struct *vma)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);

        vma->vm_flags &= ~VM_PFNMAP;
        vma->vm_flags |= VM_MIXEDMAP;

        if (msm_obj->flags & MSM_BO_WC) {
                vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
        } else if (msm_obj->flags & MSM_BO_UNCACHED) {
                vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags));
        } else {
                /*
                 * Shunt off cached objs to shmem file so they have their own
                 * address_space (so unmap_mapping_range does what we want,
                 * in particular in the case of mmap'd dmabufs)
                 */
                fput(vma->vm_file);
                get_file(obj->filp);
                vma->vm_pgoff = 0;
                vma->vm_file = obj->filp;

                vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
        }

        return 0;
}

int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma)
{
        int ret;

        ret = drm_gem_mmap(filp, vma);
        if (ret) {
                DBG("mmap failed: %d", ret);
                return ret;
        }

        return msm_gem_mmap_obj(vma->vm_private_data, vma);
}

int msm_gem_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
{
        struct drm_gem_object *obj = vma->vm_private_data;
        struct drm_device *dev = obj->dev;
        struct page **pages;
        unsigned long pfn;
        pgoff_t pgoff;
        int ret;

        /* Make sure we don't parallel update on a fault, nor move or remove
         * something from beneath our feet
         */
        ret = mutex_lock_interruptible(&dev->struct_mutex);
        if (ret)
                goto out;

        /* make sure we have pages attached now */
        pages = get_pages(obj);
        if (IS_ERR(pages)) {
                ret = PTR_ERR(pages);
                goto out_unlock;
        }

        /* We don't use vmf->pgoff since that has the fake offset: */
        pgoff = ((unsigned long)vmf->virtual_address -
                        vma->vm_start) >> PAGE_SHIFT;

        pfn = page_to_pfn(pages[pgoff]);

        VERB("Inserting %p pfn %lx, pa %lx", vmf->virtual_address,
                        pfn, pfn << PAGE_SHIFT);

        ret = vm_insert_mixed(vma, (unsigned long)vmf->virtual_address, pfn);

out_unlock:
        mutex_unlock(&dev->struct_mutex);
out:
        switch (ret) {
        case -EAGAIN:
        case 0:
        case -ERESTARTSYS:
        case -EINTR:
        case -EBUSY:
                /*
                 * EBUSY is ok: this just means that another thread
                 * already did the job.
                 */
                return VM_FAULT_NOPAGE;
        case -ENOMEM:
                return VM_FAULT_OOM;
        default:
                return VM_FAULT_SIGBUS;
        }
}

/** get mmap offset */
static uint64_t mmap_offset(struct drm_gem_object *obj)
{
        struct drm_device *dev = obj->dev;
        int ret;

        WARN_ON(!mutex_is_locked(&dev->struct_mutex));

        /* Make it mmapable */
        ret = drm_gem_create_mmap_offset(obj);
        if (ret) {
                dev_err(dev->dev, "could not allocate mmap offset\n");
                return 0;
        }

        return drm_vma_node_offset_addr(&obj->vma_node);
}

uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj)
{
        uint64_t offset;
        mutex_lock(&obj->dev->struct_mutex);
        offset = mmap_offset(obj);
        mutex_unlock(&obj->dev->struct_mutex);
        return offset;
}
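
/* Userspace reaches this offset via a map-offset ioctl (e.g. the dumb-buffer
 * DRM_IOCTL_MODE_MAP_DUMB) and then mmap()s the DRM fd at that fake offset.
 * A rough userspace-side sketch (illustrative only, not kernel code):
 *
 *      struct drm_mode_map_dumb req = { .handle = handle };
 *      drmIoctl(fd, DRM_IOCTL_MODE_MAP_DUMB, &req);
 *      ptr = mmap(NULL, size, PROT_READ | PROT_WRITE, MAP_SHARED,
 *                      fd, req.offset);
 *
 * The backing pages are only inserted lazily, on fault (msm_gem_fault() above).
 */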

/* should be called under struct_mutex.. although it can be called
 * from atomic context without struct_mutex to acquire an extra
 * iova ref if you know one is already held.
 *
 * That means when I do eventually need to add support for unpinning
 * the refcnt counter needs to be atomic_t.
 */
int msm_gem_get_iova_locked(struct drm_gem_object *obj, int id,
                uint32_t *iova)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        int ret = 0;

        if (!msm_obj->domain[id].iova) {
                struct msm_drm_private *priv = obj->dev->dev_private;
                struct msm_mmu *mmu = priv->mmus[id];
                struct page **pages = get_pages(obj);

                if (IS_ERR(pages))
                        return PTR_ERR(pages);

                if (iommu_present(&platform_bus_type)) {
                        uint32_t offset = (uint32_t)mmap_offset(obj);
                        ret = mmu->funcs->map(mmu, offset, msm_obj->sgt,
                                        obj->size, IOMMU_READ | IOMMU_WRITE);
                        msm_obj->domain[id].iova = offset;
                } else {
                        msm_obj->domain[id].iova = physaddr(obj);
                }
        }

        if (!ret)
                *iova = msm_obj->domain[id].iova;

        return ret;
}

int msm_gem_get_iova(struct drm_gem_object *obj, int id, uint32_t *iova)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        int ret;

        /* this is safe right now because we don't unmap until the
         * bo is deleted:
         */
        if (msm_obj->domain[id].iova) {
                *iova = msm_obj->domain[id].iova;
                return 0;
        }

        mutex_lock(&obj->dev->struct_mutex);
        ret = msm_gem_get_iova_locked(obj, id, iova);
        mutex_unlock(&obj->dev->struct_mutex);
        return ret;
}
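
/* Typical (hypothetical) caller sketch, e.g. pinning a buffer's GPU address
 * before command submission; 'gpu->id' here stands for whatever MMU/domain
 * index the caller uses:
 *
 *      uint32_t iova;
 *      ret = msm_gem_get_iova(obj, gpu->id, &iova);
 *      if (ret)
 *              return ret;
 *      ... emit iova into the command stream ...
 */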

void msm_gem_put_iova(struct drm_gem_object *obj, int id)
{
        // NOTE: probably don't need a _locked() version.. we wouldn't
        // normally unmap here, but instead just mark that it could be
        // unmapped (if the iova refcnt drops to zero), but then later
        // if another _get_iova_locked() fails we can start unmapping
        // things that are no longer needed..
}

int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev,
                struct drm_mode_create_dumb *args)
{
        args->pitch = align_pitch(args->width, args->bpp);
        args->size = PAGE_ALIGN(args->pitch * args->height);
        return msm_gem_new_handle(dev, file, args->size,
                        MSM_BO_SCANOUT | MSM_BO_WC, &args->handle);
}
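
/* Worked example (assuming align_pitch() merely rounds the byte pitch up to
 * a small alignment boundary): a 1920x1080 32bpp dumb buffer gives
 * pitch = 1920 * 4 = 7680 bytes and size = PAGE_ALIGN(7680 * 1080) =
 * 8294400 bytes, i.e. 2025 4K pages.
 */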

int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev,
                uint32_t handle, uint64_t *offset)
{
        struct drm_gem_object *obj;
        int ret = 0;

        /* GEM does all our handle to object mapping */
        obj = drm_gem_object_lookup(dev, file, handle);
        if (obj == NULL) {
                ret = -ENOENT;
                goto fail;
        }

        *offset = msm_gem_mmap_offset(obj);

        drm_gem_object_unreference_unlocked(obj);

fail:
        return ret;
}

void *msm_gem_vaddr_locked(struct drm_gem_object *obj)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        WARN_ON(!mutex_is_locked(&obj->dev->struct_mutex));
        if (!msm_obj->vaddr) {
                struct page **pages = get_pages(obj);
                if (IS_ERR(pages))
                        return ERR_CAST(pages);
                msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT,
                                VM_MAP, pgprot_writecombine(PAGE_KERNEL));
        }
        return msm_obj->vaddr;
}

void *msm_gem_vaddr(struct drm_gem_object *obj)
{
        void *ret;
        mutex_lock(&obj->dev->struct_mutex);
        ret = msm_gem_vaddr_locked(obj);
        mutex_unlock(&obj->dev->struct_mutex);
        return ret;
}
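
/* Illustrative (hypothetical) use: kernel-internal CPU access, e.g. an
 * fbdev-style path filling a scanout buffer:
 *
 *      void *ptr = msm_gem_vaddr(obj);
 *      if (IS_ERR(ptr))
 *              return PTR_ERR(ptr);
 *      memset(ptr, 0, obj->size);
 *
 * Note the vmap() above is always write-combined, regardless of the
 * object's cache flags.
 */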

/* setup callback for when bo is no longer busy..
 * TODO probably want to differentiate read vs write..
 */
int msm_gem_queue_inactive_cb(struct drm_gem_object *obj,
                struct msm_fence_cb *cb)
{
        struct drm_device *dev = obj->dev;
        struct msm_drm_private *priv = dev->dev_private;
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        int ret = 0;

        mutex_lock(&dev->struct_mutex);
        if (!list_empty(&cb->work.entry)) {
                ret = -EINVAL;
        } else if (is_active(msm_obj)) {
                cb->fence = max(msm_obj->read_fence, msm_obj->write_fence);
                list_add_tail(&cb->work.entry, &priv->fence_cbs);
        } else {
                queue_work(priv->wq, &cb->work);
        }
        mutex_unlock(&dev->struct_mutex);

        return ret;
}
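
/* Sketch of a (hypothetical) caller, assuming the msm_fence_cb was set up
 * with the INIT_FENCE_CB() helper from msm_drv.h so cb->work invokes the
 * callback once the fence retires:
 *
 *      static void retire_cb(struct msm_fence_cb *cb) { ... }
 *      ...
 *      INIT_FENCE_CB(&my_cb, retire_cb);
 *      ret = msm_gem_queue_inactive_cb(obj, &my_cb);
 */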

void msm_gem_move_to_active(struct drm_gem_object *obj,
                struct msm_gpu *gpu, bool write, uint32_t fence)
{
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        msm_obj->gpu = gpu;
        if (write)
                msm_obj->write_fence = fence;
        else
                msm_obj->read_fence = fence;
        list_del_init(&msm_obj->mm_list);
        list_add_tail(&msm_obj->mm_list, &gpu->active_list);
}

void msm_gem_move_to_inactive(struct drm_gem_object *obj)
{
        struct drm_device *dev = obj->dev;
        struct msm_drm_private *priv = dev->dev_private;
        struct msm_gem_object *msm_obj = to_msm_bo(obj);

        WARN_ON(!mutex_is_locked(&dev->struct_mutex));

        msm_obj->gpu = NULL;
        msm_obj->read_fence = 0;
        msm_obj->write_fence = 0;
        list_del_init(&msm_obj->mm_list);
        list_add_tail(&msm_obj->mm_list, &priv->inactive_list);
}

int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op,
                struct timespec *timeout)
{
        struct drm_device *dev = obj->dev;
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        int ret = 0;

        if (is_active(msm_obj)) {
                uint32_t fence = 0;

                if (op & MSM_PREP_READ)
                        fence = msm_obj->write_fence;
                if (op & MSM_PREP_WRITE)
                        fence = max(fence, msm_obj->read_fence);
                if (op & MSM_PREP_NOSYNC)
                        timeout = NULL;

                ret = msm_wait_fence_interruptable(dev, fence, timeout);
        }

        /* TODO cache maintenance */

        return ret;
}
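
/* This backs the MSM_GEM_CPU_PREP ioctl; a (hypothetical) userspace sketch
 * waiting for the GPU to finish writing before reading the buffer back:
 *
 *      struct drm_msm_gem_cpu_prep req = {
 *              .handle = handle,
 *              .op = MSM_PREP_READ,
 *      };
 *      drmCommandWrite(fd, DRM_MSM_GEM_CPU_PREP, &req, sizeof(req));
 */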

int msm_gem_cpu_fini(struct drm_gem_object *obj)
{
        /* TODO cache maintenance */
        return 0;
}

#ifdef CONFIG_DEBUG_FS
void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m)
{
        struct drm_device *dev = obj->dev;
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        uint64_t off = drm_vma_node_start(&obj->vma_node);

        WARN_ON(!mutex_is_locked(&dev->struct_mutex));
        seq_printf(m, "%08x: %c(r=%u,w=%u) %2d (%2d) %08llx %p %d\n",
                        msm_obj->flags, is_active(msm_obj) ? 'A' : 'I',
                        msm_obj->read_fence, msm_obj->write_fence,
                        obj->name, obj->refcount.refcount.counter,
                        off, msm_obj->vaddr, obj->size);
}

void msm_gem_describe_objects(struct list_head *list, struct seq_file *m)
{
        struct msm_gem_object *msm_obj;
        int count = 0;
        size_t size = 0;

        list_for_each_entry(msm_obj, list, mm_list) {
                struct drm_gem_object *obj = &msm_obj->base;
                seq_printf(m, "   ");
                msm_gem_describe(obj, m);
                count++;
                size += obj->size;
        }

        seq_printf(m, "Total %d objects, %zu bytes\n", count, size);
}
#endif

void msm_gem_free_object(struct drm_gem_object *obj)
{
        struct drm_device *dev = obj->dev;
        struct msm_drm_private *priv = obj->dev->dev_private;
        struct msm_gem_object *msm_obj = to_msm_bo(obj);
        int id;

        WARN_ON(!mutex_is_locked(&dev->struct_mutex));

        /* object should not be on active list: */
        WARN_ON(is_active(msm_obj));

        list_del(&msm_obj->mm_list);

        for (id = 0; id < ARRAY_SIZE(msm_obj->domain); id++) {
                struct msm_mmu *mmu = priv->mmus[id];
                if (mmu && msm_obj->domain[id].iova) {
                        uint32_t offset = (uint32_t)mmap_offset(obj);
                        mmu->funcs->unmap(mmu, offset, msm_obj->sgt, obj->size);
                }
        }

        drm_gem_free_mmap_offset(obj);

        if (obj->import_attach) {
                if (msm_obj->vaddr)
                        dma_buf_vunmap(obj->import_attach->dmabuf, msm_obj->vaddr);

                /* Don't drop the pages for imported dmabuf, as they are not
                 * ours, just free the array we allocated:
                 */
                if (msm_obj->pages)
                        drm_free_large(msm_obj->pages);

                drm_prime_gem_destroy(obj, msm_obj->sgt);
        } else {
                if (msm_obj->vaddr)
                        vunmap(msm_obj->vaddr);
                put_pages(obj);
        }

        if (msm_obj->resv == &msm_obj->_resv)
                reservation_object_fini(msm_obj->resv);

        drm_gem_object_release(obj);

        kfree(msm_obj);
}

/* convenience method to construct a GEM buffer object, and userspace handle */
int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file,
                uint32_t size, uint32_t flags, uint32_t *handle)
{
        struct drm_gem_object *obj;
        int ret;

        ret = mutex_lock_interruptible(&dev->struct_mutex);
        if (ret)
                return ret;

        obj = msm_gem_new(dev, size, flags);

        mutex_unlock(&dev->struct_mutex);

        if (IS_ERR(obj))
                return PTR_ERR(obj);

        ret = drm_gem_handle_create(file, obj, handle);

        /* drop reference from allocate - handle holds it now */
        drm_gem_object_unreference_unlocked(obj);

        return ret;
}

static int msm_gem_new_impl(struct drm_device *dev,
                uint32_t size, uint32_t flags,
                struct drm_gem_object **obj)
{
        struct msm_drm_private *priv = dev->dev_private;
        struct msm_gem_object *msm_obj;
        unsigned sz;

        switch (flags & MSM_BO_CACHE_MASK) {
        case MSM_BO_UNCACHED:
        case MSM_BO_CACHED:
        case MSM_BO_WC:
                break;
        default:
                dev_err(dev->dev, "invalid cache flag: %x\n",
                                (flags & MSM_BO_CACHE_MASK));
                return -EINVAL;
        }

        sz = sizeof(*msm_obj);
        if (!iommu_present(&platform_bus_type))
                sz += sizeof(struct drm_mm_node);

        msm_obj = kzalloc(sz, GFP_KERNEL);
        if (!msm_obj)
                return -ENOMEM;

        if (!iommu_present(&platform_bus_type))
                msm_obj->vram_node = (void *)&msm_obj[1];

        msm_obj->flags = flags;

        msm_obj->resv = &msm_obj->_resv;
        reservation_object_init(msm_obj->resv);

        INIT_LIST_HEAD(&msm_obj->submit_entry);
        list_add_tail(&msm_obj->mm_list, &priv->inactive_list);

        *obj = &msm_obj->base;

        return 0;
}
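
/* Memory layout note: in the no-IOMMU case the drm_mm_node for the VRAM
 * carveout is carved out of the same kzalloc() as the object itself, i.e.
 * conceptually:
 *
 *      +------------------------+
 *      | struct msm_gem_object  |  <- msm_obj
 *      +------------------------+
 *      | struct drm_mm_node     |  <- msm_obj->vram_node == (void *)&msm_obj[1]
 *      +------------------------+
 */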

struct drm_gem_object *msm_gem_new(struct drm_device *dev,
                uint32_t size, uint32_t flags)
{
        struct drm_gem_object *obj = NULL;
        int ret;

        WARN_ON(!mutex_is_locked(&dev->struct_mutex));

        size = PAGE_ALIGN(size);

        ret = msm_gem_new_impl(dev, size, flags, &obj);
        if (ret)
                goto fail;

        if (iommu_present(&platform_bus_type)) {
                ret = drm_gem_object_init(dev, obj, size);
                if (ret)
                        goto fail;
        } else {
                drm_gem_private_object_init(dev, obj, size);
        }

        return obj;

fail:
        if (obj)
                drm_gem_object_unreference(obj);

        return ERR_PTR(ret);
}
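
/* Illustrative (hypothetical) kernel-internal allocation, e.g. a ringbuffer
 * or similar GPU-private buffer, with struct_mutex already held:
 *
 *      bo = msm_gem_new(dev, size, MSM_BO_WC);
 *      if (IS_ERR(bo))
 *              return PTR_ERR(bo);
 */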

struct drm_gem_object *msm_gem_import(struct drm_device *dev,
                uint32_t size, struct sg_table *sgt)
{
        struct msm_gem_object *msm_obj;
        struct drm_gem_object *obj;
        int ret, npages;

        /* if we don't have IOMMU, don't bother pretending we can import: */
        if (!iommu_present(&platform_bus_type)) {
                dev_err(dev->dev, "cannot import without IOMMU\n");
                return ERR_PTR(-EINVAL);
        }

        size = PAGE_ALIGN(size);

        ret = msm_gem_new_impl(dev, size, MSM_BO_WC, &obj);
        if (ret)
                goto fail;

        drm_gem_private_object_init(dev, obj, size);

        npages = size / PAGE_SIZE;

        msm_obj = to_msm_bo(obj);
        msm_obj->sgt = sgt;
        msm_obj->pages = drm_malloc_ab(npages, sizeof(struct page *));
        if (!msm_obj->pages) {
                ret = -ENOMEM;
                goto fail;
        }

        ret = drm_prime_sg_to_page_addr_arrays(sgt, msm_obj->pages, NULL, npages);
        if (ret)
                goto fail;

        return obj;

fail:
        if (obj)
                drm_gem_object_unreference_unlocked(obj);

        return ERR_PTR(ret);
}
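
/* msm_gem_import() above is intended to be called from the dma-buf/prime
 * import path; a minimal (hypothetical) wrapper would look like:
 *
 *      struct drm_gem_object *msm_gem_prime_import_sg_table(
 *                      struct drm_device *dev, size_t size, struct sg_table *sgt)
 *      {
 *              return msm_gem_import(dev, size, sgt);
 *      }
 */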