lima_gem.c

// SPDX-License-Identifier: GPL-2.0 OR MIT
/* Copyright 2017-2019 Qiang Yu <[email protected]> */

#include <linux/mm.h>
#include <linux/iosys-map.h>
#include <linux/sync_file.h>
#include <linux/pagemap.h>
#include <linux/shmem_fs.h>
#include <linux/dma-mapping.h>

#include <drm/drm_file.h>
#include <drm/drm_syncobj.h>
#include <drm/drm_utils.h>

#include <drm/lima_drm.h>

#include "lima_drv.h"
#include "lima_gem.h"
#include "lima_vm.h"
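
/*
 * Grow the backing pages of a heap BO. Other parts of the driver are
 * expected to call this when the GPU runs out of heap space; each call
 * roughly doubles the allocation, starting from lima_heap_init_nr_pages
 * and capped at the object's full size.
 */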
int lima_heap_alloc(struct lima_bo *bo, struct lima_vm *vm)
{
	struct page **pages;
	struct address_space *mapping = bo->base.base.filp->f_mapping;
	struct device *dev = bo->base.base.dev->dev;
	size_t old_size = bo->heap_size;
	size_t new_size = bo->heap_size ? bo->heap_size * 2 :
		(lima_heap_init_nr_pages << PAGE_SHIFT);
	struct sg_table sgt;
	int i, ret;

	if (bo->heap_size >= bo->base.base.size)
		return -ENOSPC;

	new_size = min(new_size, bo->base.base.size);

	mutex_lock(&bo->base.pages_lock);
	if (bo->base.pages) {
		pages = bo->base.pages;
	} else {
		pages = kvmalloc_array(bo->base.base.size >> PAGE_SHIFT,
				       sizeof(*pages), GFP_KERNEL | __GFP_ZERO);
		if (!pages) {
			mutex_unlock(&bo->base.pages_lock);
			return -ENOMEM;
		}

		bo->base.pages = pages;
		bo->base.pages_use_count = 1;

		mapping_set_unevictable(mapping);
	}

	for (i = old_size >> PAGE_SHIFT; i < new_size >> PAGE_SHIFT; i++) {
		struct page *page = shmem_read_mapping_page(mapping, i);

		if (IS_ERR(page)) {
			mutex_unlock(&bo->base.pages_lock);
			return PTR_ERR(page);
		}
		pages[i] = page;
	}

	mutex_unlock(&bo->base.pages_lock);

	ret = sg_alloc_table_from_pages(&sgt, pages, i, 0,
					new_size, GFP_KERNEL);
	if (ret)
		return ret;

	if (bo->base.sgt) {
		dma_unmap_sgtable(dev, bo->base.sgt, DMA_BIDIRECTIONAL, 0);
		sg_free_table(bo->base.sgt);
	} else {
		bo->base.sgt = kmalloc(sizeof(*bo->base.sgt), GFP_KERNEL);
		if (!bo->base.sgt) {
			sg_free_table(&sgt);
			return -ENOMEM;
		}
	}

	ret = dma_map_sgtable(dev, &sgt, DMA_BIDIRECTIONAL, 0);
	if (ret) {
		sg_free_table(&sgt);
		kfree(bo->base.sgt);
		bo->base.sgt = NULL;
		return ret;
	}

	*bo->base.sgt = sgt;

	if (vm) {
		ret = lima_vm_map_bo(vm, bo, old_size >> PAGE_SHIFT);
		if (ret)
			return ret;
	}

	bo->heap_size = new_size;

	return 0;
}
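
/*
 * Create a shmem-backed BO and return a handle for it. Heap BOs only get
 * an initial allocation here (via lima_heap_alloc()); regular BOs get all
 * of their pages and an sg table up front.
 */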
int lima_gem_create_handle(struct drm_device *dev, struct drm_file *file,
			   u32 size, u32 flags, u32 *handle)
{
	int err;
	gfp_t mask;
	struct drm_gem_shmem_object *shmem;
	struct drm_gem_object *obj;
	struct lima_bo *bo;
	bool is_heap = flags & LIMA_BO_FLAG_HEAP;

	shmem = drm_gem_shmem_create(dev, size);
	if (IS_ERR(shmem))
		return PTR_ERR(shmem);

	obj = &shmem->base;

	/* Mali Utgard GPUs only support a 32-bit address space */
	mask = mapping_gfp_mask(obj->filp->f_mapping);
	mask &= ~__GFP_HIGHMEM;
	mask |= __GFP_DMA32;
	mapping_set_gfp_mask(obj->filp->f_mapping, mask);

	if (is_heap) {
		bo = to_lima_bo(obj);
		err = lima_heap_alloc(bo, NULL);
		if (err)
			goto out;
	} else {
		struct sg_table *sgt = drm_gem_shmem_get_pages_sgt(shmem);

		if (IS_ERR(sgt)) {
			err = PTR_ERR(sgt);
			goto out;
		}
	}

	err = drm_gem_handle_create(file, obj, handle);

out:
	/* drop reference from allocate - handle holds it now */
	drm_gem_object_put(obj);

	return err;
}
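
/*
 * GEM object callbacks: open/close attach and detach the BO from the
 * per-file lima_vm; free warns if any GPU VA mappings are left behind.
 */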
static void lima_gem_free_object(struct drm_gem_object *obj)
{
	struct lima_bo *bo = to_lima_bo(obj);

	if (!list_empty(&bo->va))
		dev_err(obj->dev->dev, "lima gem free bo still has va\n");

	drm_gem_shmem_free(&bo->base);
}

static int lima_gem_object_open(struct drm_gem_object *obj, struct drm_file *file)
{
	struct lima_bo *bo = to_lima_bo(obj);
	struct lima_drm_priv *priv = to_lima_drm_priv(file);
	struct lima_vm *vm = priv->vm;

	return lima_vm_bo_add(vm, bo, true);
}

static void lima_gem_object_close(struct drm_gem_object *obj, struct drm_file *file)
{
	struct lima_bo *bo = to_lima_bo(obj);
	struct lima_drm_priv *priv = to_lima_drm_priv(file);
	struct lima_vm *vm = priv->vm;

	lima_vm_bo_del(vm, bo);
}
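
/*
 * Heap BOs grow at runtime and are never fully backed, so pin, vmap and
 * mmap are refused for them.
 */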
static int lima_gem_pin(struct drm_gem_object *obj)
{
	struct lima_bo *bo = to_lima_bo(obj);

	if (bo->heap_size)
		return -EINVAL;

	return drm_gem_shmem_pin(&bo->base);
}

static int lima_gem_vmap(struct drm_gem_object *obj, struct iosys_map *map)
{
	struct lima_bo *bo = to_lima_bo(obj);

	if (bo->heap_size)
		return -EINVAL;

	return drm_gem_shmem_vmap(&bo->base, map);
}

static int lima_gem_mmap(struct drm_gem_object *obj, struct vm_area_struct *vma)
{
	struct lima_bo *bo = to_lima_bo(obj);

	if (bo->heap_size)
		return -EINVAL;

	return drm_gem_shmem_mmap(&bo->base, vma);
}

static const struct drm_gem_object_funcs lima_gem_funcs = {
	.free = lima_gem_free_object,
	.open = lima_gem_object_open,
	.close = lima_gem_object_close,
	.print_info = drm_gem_shmem_object_print_info,
	.pin = lima_gem_pin,
	.unpin = drm_gem_shmem_object_unpin,
	.get_sg_table = drm_gem_shmem_object_get_sg_table,
	.vmap = lima_gem_vmap,
	.vunmap = drm_gem_shmem_object_vunmap,
	.mmap = lima_gem_mmap,
	.vm_ops = &drm_gem_shmem_vm_ops,
};
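
/*
 * Allocate the driver-specific BO wrapper used by the shmem helpers;
 * map_wc requests write-combined CPU mappings.
 */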
struct drm_gem_object *lima_gem_create_object(struct drm_device *dev, size_t size)
{
	struct lima_bo *bo;

	bo = kzalloc(sizeof(*bo), GFP_KERNEL);
	if (!bo)
		return ERR_PTR(-ENOMEM);

	mutex_init(&bo->lock);
	INIT_LIST_HEAD(&bo->va);
	bo->base.map_wc = true;
	bo->base.base.funcs = &lima_gem_funcs;

	return &bo->base.base;
}
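
/* Report the BO's GPU virtual address and its mmap fake offset to userspace. */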
int lima_gem_get_info(struct drm_file *file, u32 handle, u32 *va, u64 *offset)
{
	struct drm_gem_object *obj;
	struct lima_bo *bo;
	struct lima_drm_priv *priv = to_lima_drm_priv(file);
	struct lima_vm *vm = priv->vm;

	obj = drm_gem_object_lookup(file, handle);
	if (!obj)
		return -ENOENT;

	bo = to_lima_bo(obj);

	*va = lima_vm_get_va(vm, bo);

	*offset = drm_vma_node_offset_addr(&obj->vma_node);

	drm_gem_object_put(obj);

	return 0;
}
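
/*
 * Reserve a fence slot on the BO's reservation object and, for implicit
 * sync, add the BO's existing resv fences as scheduler dependencies.
 */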
static int lima_gem_sync_bo(struct lima_sched_task *task, struct lima_bo *bo,
			    bool write, bool explicit)
{
	int err;

	err = dma_resv_reserve_fences(lima_bo_resv(bo), 1);
	if (err)
		return err;

	/* explicit sync uses the user-passed dependency fences instead */
	if (explicit)
		return 0;

	return drm_sched_job_add_implicit_dependencies(&task->base,
						       &bo->base.base,
						       write);
}
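
/* Turn the syncobjs passed in by userspace into scheduler job dependencies. */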
static int lima_gem_add_deps(struct drm_file *file, struct lima_submit *submit)
{
	int i, err;

	for (i = 0; i < ARRAY_SIZE(submit->in_sync); i++) {
		struct dma_fence *fence = NULL;

		if (!submit->in_sync[i])
			continue;

		err = drm_syncobj_find_fence(file, submit->in_sync[i],
					     0, 0, &fence);
		if (err)
			return err;

		err = drm_sched_job_add_dependency(&submit->task->base, fence);
		if (err) {
			dma_fence_put(fence);
			return err;
		}
	}

	return 0;
}
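
/*
 * Submit a job: look up the BOs and take references on their GPU VA
 * mappings, lock all reservations, set up the scheduler task and its
 * dependencies, queue it, then publish the job fence to each BO's resv
 * and to the optional out-syncobj.
 */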
int lima_gem_submit(struct drm_file *file, struct lima_submit *submit)
{
	int i, err = 0;
	struct ww_acquire_ctx ctx;
	struct lima_drm_priv *priv = to_lima_drm_priv(file);
	struct lima_vm *vm = priv->vm;
	struct drm_syncobj *out_sync = NULL;
	struct dma_fence *fence;
	struct lima_bo **bos = submit->lbos;

	if (submit->out_sync) {
		out_sync = drm_syncobj_find(file, submit->out_sync);
		if (!out_sync)
			return -ENOENT;
	}

	for (i = 0; i < submit->nr_bos; i++) {
		struct drm_gem_object *obj;
		struct lima_bo *bo;

		obj = drm_gem_object_lookup(file, submit->bos[i].handle);
		if (!obj) {
			err = -ENOENT;
			goto err_out0;
		}

		bo = to_lima_bo(obj);

		/* take a reference on the GPU VA mapping so it can't be
		 * unmapped while the task executes; dropped when the task
		 * is done
		 */
		err = lima_vm_bo_add(vm, bo, false);
		if (err) {
			drm_gem_object_put(obj);
			goto err_out0;
		}

		bos[i] = bo;
	}

	err = drm_gem_lock_reservations((struct drm_gem_object **)bos,
					submit->nr_bos, &ctx);
	if (err)
		goto err_out0;

	err = lima_sched_task_init(
		submit->task, submit->ctx->context + submit->pipe,
		bos, submit->nr_bos, vm);
	if (err)
		goto err_out1;

	err = lima_gem_add_deps(file, submit);
	if (err)
		goto err_out2;

	for (i = 0; i < submit->nr_bos; i++) {
		err = lima_gem_sync_bo(
			submit->task, bos[i],
			submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE,
			submit->flags & LIMA_SUBMIT_FLAG_EXPLICIT_FENCE);
		if (err)
			goto err_out2;
	}

	fence = lima_sched_context_queue_task(submit->task);

	for (i = 0; i < submit->nr_bos; i++) {
		dma_resv_add_fence(lima_bo_resv(bos[i]), fence,
				   submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE ?
				   DMA_RESV_USAGE_WRITE : DMA_RESV_USAGE_READ);
	}

	drm_gem_unlock_reservations((struct drm_gem_object **)bos,
				    submit->nr_bos, &ctx);

	for (i = 0; i < submit->nr_bos; i++)
		drm_gem_object_put(&bos[i]->base.base);

	if (out_sync) {
		drm_syncobj_replace_fence(out_sync, fence);
		drm_syncobj_put(out_sync);
	}

	dma_fence_put(fence);

	return 0;

err_out2:
	lima_sched_task_fini(submit->task);
err_out1:
	drm_gem_unlock_reservations((struct drm_gem_object **)bos,
				    submit->nr_bos, &ctx);
err_out0:
	for (i = 0; i < submit->nr_bos; i++) {
		if (!bos[i])
			break;
		lima_vm_bo_del(vm, bos[i]);
		drm_gem_object_put(&bos[i]->base.base);
	}
	if (out_sync)
		drm_syncobj_put(out_sync);
	return err;
}
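
/* Wait for fences on a BO's reservation object, honouring an absolute timeout. */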
int lima_gem_wait(struct drm_file *file, u32 handle, u32 op, s64 timeout_ns)
{
	bool write = op & LIMA_GEM_WAIT_WRITE;
	long ret, timeout;

	if (!op)
		return 0;

	timeout = drm_timeout_abs_to_jiffies(timeout_ns);

	ret = drm_gem_dma_resv_wait(file, handle, write, timeout);
	if (ret == -ETIME)
		ret = timeout ? -ETIMEDOUT : -EBUSY;

	return ret;
}