/*
 * SPDX-License-Identifier: MIT
 *
 * Copyright 2012 Red Hat Inc
 */
#include <linux/dma-buf.h>
#include <linux/highmem.h>
#include <linux/dma-resv.h>
#include <linux/module.h>

#include <asm/smp.h>

#include "gem/i915_gem_dmabuf.h"
#include "i915_drv.h"
#include "i915_gem_object.h"
#include "i915_scatterlist.h"

MODULE_IMPORT_NS(DMA_BUF);

I915_SELFTEST_DECLARE(static bool force_different_devices;)
static struct drm_i915_gem_object *dma_buf_to_obj(struct dma_buf *buf)
{
	return to_intel_bo(buf->priv);
}
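/*
 * Build an independent copy of the exporter's scatterlist and DMA-map it
 * for the importer's device; the copy is torn down again in
 * i915_gem_unmap_dma_buf().
 */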
static struct sg_table *i915_gem_map_dma_buf(struct dma_buf_attachment *attachment,
					     enum dma_data_direction dir)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(attachment->dmabuf);
	struct sg_table *st;
	struct scatterlist *src, *dst;
	int ret, i;

	/* Copy sg so that we make an independent mapping */
	st = kmalloc(sizeof(struct sg_table), GFP_KERNEL);
	if (!st) {
		ret = -ENOMEM;
		goto err;
	}

	ret = sg_alloc_table(st, obj->mm.pages->nents, GFP_KERNEL);
	if (ret)
		goto err_free;

	src = obj->mm.pages->sgl;
	dst = st->sgl;
	for (i = 0; i < obj->mm.pages->nents; i++) {
		sg_set_page(dst, sg_page(src), src->length, 0);
		dst = sg_next(dst);
		src = sg_next(src);
	}

	ret = dma_map_sgtable(attachment->dev, st, dir, DMA_ATTR_SKIP_CPU_SYNC);
	if (ret)
		goto err_free_sg;

	return st;

err_free_sg:
	sg_free_table(st);
err_free:
	kfree(st);
err:
	return ERR_PTR(ret);
}
static void i915_gem_unmap_dma_buf(struct dma_buf_attachment *attachment,
				   struct sg_table *sg,
				   enum dma_data_direction dir)
{
	dma_unmap_sgtable(attachment->dev, sg, dir, DMA_ATTR_SKIP_CPU_SYNC);
	sg_free_table(sg);
	kfree(sg);
}
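/* Pin the object's pages and expose a WB kernel mapping to the importer. */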
static int i915_gem_dmabuf_vmap(struct dma_buf *dma_buf,
				struct iosys_map *map)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	void *vaddr;

	vaddr = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WB);
	if (IS_ERR(vaddr))
		return PTR_ERR(vaddr);

	iosys_map_set_vaddr(map, vaddr);

	return 0;
}
static void i915_gem_dmabuf_vunmap(struct dma_buf *dma_buf,
				   struct iosys_map *map)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);

	i915_gem_object_flush_map(obj);
	i915_gem_object_unpin_map(obj);
}
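/*
 * mmap of the exported dma-buf is forwarded to the object's backing file
 * (shmem); objects without one are rejected.
 */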
static int i915_gem_dmabuf_mmap(struct dma_buf *dma_buf, struct vm_area_struct *vma)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	int ret;

	if (obj->base.size < vma->vm_end - vma->vm_start)
		return -EINVAL;

	if (!obj->base.filp)
		return -ENODEV;

	ret = call_mmap(obj->base.filp, vma);
	if (ret)
		return ret;

	vma_set_file(vma, obj->base.filp);

	return 0;
}
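/*
 * begin/end_cpu_access bracket CPU access by the importer: move the object
 * into the CPU domain (flushing as needed) and back to the coherent GTT
 * domain afterwards, retrying the ww locking dance on -EDEADLK.
 */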
static int i915_gem_begin_cpu_access(struct dma_buf *dma_buf, enum dma_data_direction direction)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	bool write = (direction == DMA_BIDIRECTIONAL || direction == DMA_TO_DEVICE);
	struct i915_gem_ww_ctx ww;
	int err;

	i915_gem_ww_ctx_init(&ww, true);
retry:
	err = i915_gem_object_lock(obj, &ww);
	if (!err)
		err = i915_gem_object_pin_pages(obj);
	if (!err) {
		err = i915_gem_object_set_to_cpu_domain(obj, write);
		i915_gem_object_unpin_pages(obj);
	}
	if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);
	return err;
}
static int i915_gem_end_cpu_access(struct dma_buf *dma_buf, enum dma_data_direction direction)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	struct i915_gem_ww_ctx ww;
	int err;

	i915_gem_ww_ctx_init(&ww, true);
retry:
	err = i915_gem_object_lock(obj, &ww);
	if (!err)
		err = i915_gem_object_pin_pages(obj);
	if (!err) {
		err = i915_gem_object_set_to_gtt_domain(obj, false);
		i915_gem_object_unpin_pages(obj);
	}
	if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);
	return err;
}
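/*
 * On attach, make sure the object is backed by system memory: migrate it to
 * SMEM if necessary, wait for the migration and pin the pages so they cannot
 * move while the buffer is attached.
 */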
static int i915_gem_dmabuf_attach(struct dma_buf *dmabuf,
				  struct dma_buf_attachment *attach)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dmabuf);
	struct i915_gem_ww_ctx ww;
	int err;

	if (!i915_gem_object_can_migrate(obj, INTEL_REGION_SMEM))
		return -EOPNOTSUPP;

	for_i915_gem_ww(&ww, err, true) {
		err = i915_gem_object_lock(obj, &ww);
		if (err)
			continue;

		err = i915_gem_object_migrate(obj, &ww, INTEL_REGION_SMEM);
		if (err)
			continue;

		err = i915_gem_object_wait_migration(obj, 0);
		if (err)
			continue;

		err = i915_gem_object_pin_pages(obj);
	}

	return err;
}
static void i915_gem_dmabuf_detach(struct dma_buf *dmabuf,
				   struct dma_buf_attachment *attach)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dmabuf);

	i915_gem_object_unpin_pages(obj);
}
static const struct dma_buf_ops i915_dmabuf_ops = {
	.attach = i915_gem_dmabuf_attach,
	.detach = i915_gem_dmabuf_detach,
	.map_dma_buf = i915_gem_map_dma_buf,
	.unmap_dma_buf = i915_gem_unmap_dma_buf,
	.release = drm_gem_dmabuf_release,
	.mmap = i915_gem_dmabuf_mmap,
	.vmap = i915_gem_dmabuf_vmap,
	.vunmap = i915_gem_dmabuf_vunmap,
	.begin_cpu_access = i915_gem_begin_cpu_access,
	.end_cpu_access = i915_gem_end_cpu_access,
};
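/*
 * Export an i915 GEM object as a dma-buf, sharing the object's reservation
 * object so fences are visible to both exporter and importer.
 */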
struct dma_buf *i915_gem_prime_export(struct drm_gem_object *gem_obj, int flags)
{
	struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
	DEFINE_DMA_BUF_EXPORT_INFO(exp_info);

	exp_info.ops = &i915_dmabuf_ops;
	exp_info.size = gem_obj->size;
	exp_info.flags = flags;
	exp_info.priv = gem_obj;
	exp_info.resv = obj->base.resv;

	if (obj->ops->dmabuf_export) {
		int ret = obj->ops->dmabuf_export(obj);
		if (ret)
			return ERR_PTR(ret);
	}

	return drm_gem_dmabuf_export(gem_obj->dev, &exp_info);
}
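/*
 * Page acquisition for imported objects: map the attachment and adopt the
 * resulting sg_table as the object's backing pages.
 */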
static int i915_gem_object_get_pages_dmabuf(struct drm_i915_gem_object *obj)
{
	struct drm_i915_private *i915 = to_i915(obj->base.dev);
	struct sg_table *pages;
	unsigned int sg_page_sizes;

	assert_object_held(obj);

	pages = dma_buf_map_attachment(obj->base.import_attach,
				       DMA_BIDIRECTIONAL);
	if (IS_ERR(pages))
		return PTR_ERR(pages);

	/*
	 * DG1 is special here since it still snoops transactions even with
	 * CACHE_NONE. This is not the case with other HAS_SNOOP platforms. We
	 * might need to revisit this as we add new discrete platforms.
	 *
	 * XXX: Consider doing a vmap flush or something, where possible.
	 * Currently we just do a heavy handed wbinvd_on_all_cpus() here since
	 * the underlying sg_table might not even point to struct pages, so we
	 * can't just call drm_clflush_sg or similar, like we do elsewhere in
	 * the driver.
	 */
	if (i915_gem_object_can_bypass_llc(obj) ||
	    (!HAS_LLC(i915) && !IS_DG1(i915)))
		wbinvd_on_all_cpus();

	sg_page_sizes = i915_sg_dma_sizes(pages->sgl);
	__i915_gem_object_set_pages(obj, pages, sg_page_sizes);

	return 0;
}
static void i915_gem_object_put_pages_dmabuf(struct drm_i915_gem_object *obj,
					     struct sg_table *pages)
{
	dma_buf_unmap_attachment(obj->base.import_attach, pages,
				 DMA_BIDIRECTIONAL);
}
static const struct drm_i915_gem_object_ops i915_gem_object_dmabuf_ops = {
	.name = "i915_gem_object_dmabuf",
	.get_pages = i915_gem_object_get_pages_dmabuf,
	.put_pages = i915_gem_object_put_pages_dmabuf,
};
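/*
 * Import a dma-buf into i915. A buffer we exported ourselves from the same
 * device is short-circuited back to the original GEM object; anything else
 * is wrapped in a new GEM object backed by the attachment.
 */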
struct drm_gem_object *i915_gem_prime_import(struct drm_device *dev,
					     struct dma_buf *dma_buf)
{
	static struct lock_class_key lock_class;
	struct dma_buf_attachment *attach;
	struct drm_i915_gem_object *obj;
	int ret;

	/* is this one of our own objects? */
	if (dma_buf->ops == &i915_dmabuf_ops) {
		obj = dma_buf_to_obj(dma_buf);
		/* is it from our device? */
		if (obj->base.dev == dev &&
		    !I915_SELFTEST_ONLY(force_different_devices)) {
			/*
			 * Importing dmabuf exported from our own gem increases
			 * refcount on gem itself instead of f_count of dmabuf.
			 */
			return &i915_gem_object_get(obj)->base;
		}
	}

	if (i915_gem_object_size_2big(dma_buf->size))
		return ERR_PTR(-E2BIG);

	/* need to attach */
	attach = dma_buf_attach(dma_buf, dev->dev);
	if (IS_ERR(attach))
		return ERR_CAST(attach);

	get_dma_buf(dma_buf);

	obj = i915_gem_object_alloc();
	if (!obj) {
		ret = -ENOMEM;
		goto fail_detach;
	}

	drm_gem_private_object_init(dev, &obj->base, dma_buf->size);
	i915_gem_object_init(obj, &i915_gem_object_dmabuf_ops, &lock_class,
			     I915_BO_ALLOC_USER);
	obj->base.import_attach = attach;
	obj->base.resv = dma_buf->resv;

	/* We use GTT as shorthand for a coherent domain, one that is
	 * neither in the GPU cache nor in the CPU cache, where all
	 * writes are immediately visible in memory. (That's not strictly
	 * true, but it's close! There are internal buffers such as the
	 * write-combined buffer or a delay through the chipset for GTT
	 * writes that do require us to treat GTT as a separate cache domain.)
	 */
	obj->read_domains = I915_GEM_DOMAIN_GTT;
	obj->write_domain = 0;

	return &obj->base;

fail_detach:
	dma_buf_detach(dma_buf, attach);
	dma_buf_put(dma_buf);

	return ERR_PTR(ret);
}
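/*
 * The selftest sources are included directly so they can exercise the static
 * functions defined in this file.
 */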
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
#include "selftests/mock_dmabuf.c"
#include "selftests/i915_gem_dmabuf.c"
#endif