// SPDX-License-Identifier: GPL-2.0+
/* Copyright (C) 2015-2018 Broadcom */

/**
 * DOC: V3D GEM BO management support
 *
 * Compared to VC4 (V3D 2.x), V3D 3.3 introduces an MMU between the
 * GPU and the bus, allowing us to use shmem objects for our storage
 * instead of CMA.
 *
 * Physically contiguous objects may still be imported to V3D, but the
 * driver doesn't allocate physically contiguous objects on its own.
 * Display engines requiring physically contiguous allocations should
 * look into Mesa's "renderonly" support (as used by the Mesa pl111
 * driver) for an example of how to integrate with V3D.
 *
 * Long term, we should support evicting pages from the MMU when under
 * memory pressure (thus the v3d_bo_get_pages() refcounting), but
 * that's not a high priority since our systems tend to not have swap.
 */

#include <linux/dma-buf.h>
#include <linux/pfn_t.h>
#include <linux/vmalloc.h>

#include "v3d_drv.h"
#include "uapi/drm/v3d_drm.h"

static enum drm_gem_object_status v3d_gem_status(struct drm_gem_object *obj)
{
	struct v3d_bo *bo = to_v3d_bo(obj);
	enum drm_gem_object_status res = 0;

	if (bo->base.pages)
		res |= DRM_GEM_OBJECT_RESIDENT;

	return res;
}

/* Called by the DRM core on the last userspace/kernel unreference of
 * the BO.
 */
void v3d_free_object(struct drm_gem_object *obj)
{
	struct v3d_dev *v3d = to_v3d_dev(obj->dev);
	struct v3d_bo *bo = to_v3d_bo(obj);

	if (bo->vaddr)
		v3d_put_bo_vaddr(bo);

	v3d_mmu_remove_ptes(bo);

	mutex_lock(&v3d->bo_lock);
	v3d->bo_stats.num_allocated--;
	v3d->bo_stats.pages_allocated -= obj->size >> V3D_MMU_PAGE_SHIFT;
	mutex_unlock(&v3d->bo_lock);

	spin_lock(&v3d->mm_lock);
	drm_mm_remove_node(&bo->node);
	spin_unlock(&v3d->mm_lock);

	/* GPU execution may have dirtied any pages in the BO. */
	bo->base.pages_mark_dirty_on_put = true;

	drm_gem_shmem_free(&bo->base);
}

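/* GEM object callbacks: most operations are delegated to the shmem
 * helpers, with V3D-specific free and status hooks.
 */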
static const struct drm_gem_object_funcs v3d_gem_funcs = {
	.free = v3d_free_object,
	.print_info = drm_gem_shmem_object_print_info,
	.pin = drm_gem_shmem_object_pin,
	.unpin = drm_gem_shmem_object_unpin,
	.get_sg_table = drm_gem_shmem_object_get_sg_table,
	.vmap = drm_gem_shmem_object_vmap,
	.vunmap = drm_gem_shmem_object_vunmap,
	.mmap = drm_gem_shmem_object_mmap,
	.status = v3d_gem_status,
	.vm_ops = &drm_gem_shmem_vm_ops,
};

/* gem_create_object function for allocating a BO struct and doing
 * early setup.
 */
struct drm_gem_object *v3d_create_object(struct drm_device *dev, size_t size)
{
	struct v3d_bo *bo;
	struct drm_gem_object *obj;

	if (size == 0)
		return ERR_PTR(-EINVAL);

	bo = kzalloc(sizeof(*bo), GFP_KERNEL);
	if (!bo)
		return ERR_PTR(-ENOMEM);
	obj = &bo->base.base;

	obj->funcs = &v3d_gem_funcs;
	bo->base.map_wc = true;
	INIT_LIST_HEAD(&bo->unref_head);

	return &bo->base.base;
}

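/* Completes BO setup shared by native allocation and dma-buf import:
 * pins the backing pages, reserves a region in the GPU's address space,
 * and writes the page table entries.
 */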
static int
v3d_bo_create_finish(struct drm_gem_object *obj)
{
	struct v3d_dev *v3d = to_v3d_dev(obj->dev);
	struct v3d_bo *bo = to_v3d_bo(obj);
	struct sg_table *sgt;
	int ret;

	/* So far we pin the BO in the MMU for its lifetime, so use
	 * shmem's helper for getting a lifetime sgt.
	 */
	sgt = drm_gem_shmem_get_pages_sgt(&bo->base);
	if (IS_ERR(sgt))
		return PTR_ERR(sgt);

	spin_lock(&v3d->mm_lock);
	/* Allocate the object's space in the GPU's page tables.
	 * Inserting PTEs will happen later, but the offset is for the
	 * lifetime of the BO.
	 */
	ret = drm_mm_insert_node_generic(&v3d->mm, &bo->node,
					 obj->size >> V3D_MMU_PAGE_SHIFT,
					 GMP_GRANULARITY >> V3D_MMU_PAGE_SHIFT, 0, 0);
	spin_unlock(&v3d->mm_lock);
	if (ret)
		return ret;

	/* Track stats for /debug/dri/n/bo_stats. */
	mutex_lock(&v3d->bo_lock);
	v3d->bo_stats.num_allocated++;
	v3d->bo_stats.pages_allocated += obj->size >> V3D_MMU_PAGE_SHIFT;
	mutex_unlock(&v3d->bo_lock);

	v3d_mmu_insert_ptes(bo);

	return 0;
}

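/* Allocates a shmem-backed BO and performs the V3D-specific setup
 * (GPU address space allocation and PTE insertion).
 */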
struct v3d_bo *v3d_bo_create(struct drm_device *dev, struct drm_file *file_priv,
			     size_t unaligned_size)
{
	struct drm_gem_shmem_object *shmem_obj;
	struct v3d_bo *bo;
	int ret;

	shmem_obj = drm_gem_shmem_create(dev, unaligned_size);
	if (IS_ERR(shmem_obj))
		return ERR_CAST(shmem_obj);
	bo = to_v3d_bo(&shmem_obj->base);
	bo->vaddr = NULL;

	ret = v3d_bo_create_finish(&shmem_obj->base);
	if (ret)
		goto free_obj;

	return bo;

free_obj:
	drm_gem_shmem_free(shmem_obj);
	return ERR_PTR(ret);
}

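/* Imports a dma-buf's sg_table as a shmem object, then runs the same
 * MMU setup as a natively allocated BO.
 */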
struct drm_gem_object *
v3d_prime_import_sg_table(struct drm_device *dev,
			  struct dma_buf_attachment *attach,
			  struct sg_table *sgt)
{
	struct drm_gem_object *obj;
	int ret;

	obj = drm_gem_shmem_prime_import_sg_table(dev, attach, sgt);
	if (IS_ERR(obj))
		return obj;

	ret = v3d_bo_create_finish(obj);
	if (ret) {
		drm_gem_shmem_free(&to_v3d_bo(obj)->base);
		return ERR_PTR(ret);
	}

	return obj;
}

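/* Maps the BO's pages into a contiguous, write-combined kernel virtual
 * address range so the CPU can access them through bo->vaddr.
 */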
void v3d_get_bo_vaddr(struct v3d_bo *bo)
{
	struct drm_gem_shmem_object *obj = &bo->base;

	bo->vaddr = vmap(obj->pages, obj->base.size >> PAGE_SHIFT, VM_MAP,
			 pgprot_writecombine(PAGE_KERNEL));
}

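/* Releases the kernel mapping set up by v3d_get_bo_vaddr(). */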
void v3d_put_bo_vaddr(struct v3d_bo *bo)
{
	vunmap(bo->vaddr);
	bo->vaddr = NULL;
}

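/* Creates a BO of the requested size, returning a handle and the BO's
 * offset in the GPU's address space to userspace.
 */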
int v3d_create_bo_ioctl(struct drm_device *dev, void *data,
			struct drm_file *file_priv)
{
	struct drm_v3d_create_bo *args = data;
	struct v3d_bo *bo = NULL;
	int ret;

	if (args->flags != 0) {
		DRM_INFO("unknown create_bo flags: %d\n", args->flags);
		return -EINVAL;
	}

	bo = v3d_bo_create(dev, file_priv, PAGE_ALIGN(args->size));
	if (IS_ERR(bo))
		return PTR_ERR(bo);

	args->offset = bo->node.start << V3D_MMU_PAGE_SHIFT;

	ret = drm_gem_handle_create(file_priv, &bo->base.base, &args->handle);
	drm_gem_object_put(&bo->base.base);

	return ret;
}

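/* Returns the fake mmap offset for a BO so userspace can map it
 * through the DRM file descriptor.
 */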
int v3d_mmap_bo_ioctl(struct drm_device *dev, void *data,
		      struct drm_file *file_priv)
{
	struct drm_v3d_mmap_bo *args = data;
	struct drm_gem_object *gem_obj;

	if (args->flags != 0) {
		DRM_INFO("unknown mmap_bo flags: %d\n", args->flags);
		return -EINVAL;
	}

	gem_obj = drm_gem_object_lookup(file_priv, args->handle);
	if (!gem_obj) {
		DRM_DEBUG("Failed to look up GEM BO %d\n", args->handle);
		return -ENOENT;
	}

	args->offset = drm_vma_node_offset_addr(&gem_obj->vma_node);
	drm_gem_object_put(gem_obj);

	return 0;
}

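/* Looks up a BO by handle and returns its offset in the GPU's address
 * space, as assigned at creation time.
 */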
int v3d_get_bo_offset_ioctl(struct drm_device *dev, void *data,
			    struct drm_file *file_priv)
{
	struct drm_v3d_get_bo_offset *args = data;
	struct drm_gem_object *gem_obj;
	struct v3d_bo *bo;

	gem_obj = drm_gem_object_lookup(file_priv, args->handle);
	if (!gem_obj) {
		DRM_DEBUG("Failed to look up GEM BO %d\n", args->handle);
		return -ENOENT;
	}
	bo = to_v3d_bo(gem_obj);

	args->offset = bo->node.start << V3D_MMU_PAGE_SHIFT;

	drm_gem_object_put(gem_obj);

	return 0;
}

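/* Waits for fences on the BO's reservation object to signal, up to the
 * user-supplied timeout, and writes back the remaining timeout.
 */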
int
v3d_wait_bo_ioctl(struct drm_device *dev, void *data,
		  struct drm_file *file_priv)
{
	int ret;
	struct drm_v3d_wait_bo *args = data;
	ktime_t start = ktime_get();
	u64 delta_ns;
	unsigned long timeout_jiffies =
		nsecs_to_jiffies_timeout(args->timeout_ns);

	if (args->pad != 0)
		return -EINVAL;

	ret = drm_gem_dma_resv_wait(file_priv, args->handle,
				    true, timeout_jiffies);

	/* Decrement the user's timeout, in case we got interrupted
	 * such that the ioctl will be restarted.
	 */
	delta_ns = ktime_to_ns(ktime_sub(ktime_get(), start));
	if (delta_ns < args->timeout_ns)
		args->timeout_ns -= delta_ns;
	else
		args->timeout_ns = 0;

	/* Asked to wait beyond the jiffy/scheduler precision? */
	if (ret == -ETIME && args->timeout_ns)
		ret = -EAGAIN;

	return ret;
}