/*
 * SPDX-License-Identifier: MIT
 *
 * Copyright 2012 Red Hat Inc
 */
#include <linux/dma-buf.h>
#include <linux/highmem.h>
#include <linux/dma-resv.h>
#include <linux/module.h>

#include "i915_drv.h"
#include "i915_gem_object.h"
#include "i915_scatterlist.h"

MODULE_IMPORT_NS(DMA_BUF);
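
/*
 * wbinvd_on_all_cpus() is only available on x86; elsewhere fall back to a
 * loud warning, as we have no portable way to flush CPU caches for memory
 * that may not be backed by struct pages.
 */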
#if defined(CONFIG_X86)
#include <asm/smp.h>
#else
#define wbinvd_on_all_cpus() \
	pr_warn(DRIVER_NAME ": Missing cache flush in %s\n", __func__)
#endif
I915_SELFTEST_DECLARE(static bool force_different_devices;)
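
/* Look up the i915 GEM object wrapped by an exported dma-buf. */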
static struct drm_i915_gem_object *dma_buf_to_obj(struct dma_buf *buf)
{
	return to_intel_bo(buf->priv);
}
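
/*
 * Build the importer's view of the object: clone our sg_table and DMA-map
 * it through the attaching device, so every attachment gets an independent
 * mapping of the same backing pages.
 */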
static struct sg_table *i915_gem_map_dma_buf(struct dma_buf_attachment *attachment,
					     enum dma_data_direction dir)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(attachment->dmabuf);
	struct sg_table *st;
	struct scatterlist *src, *dst;
	int ret, i;

	/* Copy sg so that we make an independent mapping */
	st = kmalloc(sizeof(struct sg_table), GFP_KERNEL);
	if (st == NULL) {
		ret = -ENOMEM;
		goto err;
	}

	ret = sg_alloc_table(st, obj->mm.pages->nents, GFP_KERNEL);
	if (ret)
		goto err_free;

	src = obj->mm.pages->sgl;
	dst = st->sgl;
	for (i = 0; i < obj->mm.pages->nents; i++) {
		sg_set_page(dst, sg_page(src), src->length, 0);
		dst = sg_next(dst);
		src = sg_next(src);
	}

	ret = dma_map_sgtable(attachment->dev, st, dir, DMA_ATTR_SKIP_CPU_SYNC);
	if (ret)
		goto err_free_sg;

	return st;

err_free_sg:
	sg_free_table(st);
err_free:
	kfree(st);
err:
	return ERR_PTR(ret);
}
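
/* Teardown mirrors i915_gem_map_dma_buf(): unmap, then free the cloned table. */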
static void i915_gem_unmap_dma_buf(struct dma_buf_attachment *attachment,
				   struct sg_table *sg,
				   enum dma_data_direction dir)
{
	dma_unmap_sgtable(attachment->dev, sg, dir, DMA_ATTR_SKIP_CPU_SYNC);
	sg_free_table(sg);
	kfree(sg);
}
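
/*
 * vmap pins the object's pages and returns a write-back kernel mapping;
 * vunmap below flushes that mapping before unpinning.
 */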
static int i915_gem_dmabuf_vmap(struct dma_buf *dma_buf, struct dma_buf_map *map)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	void *vaddr;

	vaddr = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WB);
	if (IS_ERR(vaddr))
		return PTR_ERR(vaddr);

	dma_buf_map_set_vaddr(map, vaddr);

	return 0;
}
static void i915_gem_dmabuf_vunmap(struct dma_buf *dma_buf, struct dma_buf_map *map)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);

	i915_gem_object_flush_map(obj);
	i915_gem_object_unpin_map(obj);
}
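
/*
 * mmap is delegated to the object's shmem backing file: reject vmas larger
 * than the object, let the file's mmap handler install the mapping, then
 * point the vma at the backing file.
 */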
static int i915_gem_dmabuf_mmap(struct dma_buf *dma_buf, struct vm_area_struct *vma)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	int ret;

	if (obj->base.size < vma->vm_end - vma->vm_start)
		return -EINVAL;

	if (!obj->base.filp)
		return -ENODEV;

	ret = call_mmap(obj->base.filp, vma);
	if (ret)
		return ret;

	vma_set_file(vma, obj->base.filp);

	return 0;
}
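
/*
 * CPU-access callbacks use the ww locking dance: on -EDEADLK the context
 * backs off (dropping contended locks) and retries, so lock cycles across
 * multiple objects are resolved instead of deadlocking.
 */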
static int i915_gem_begin_cpu_access(struct dma_buf *dma_buf, enum dma_data_direction direction)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	bool write = (direction == DMA_BIDIRECTIONAL || direction == DMA_TO_DEVICE);
	struct i915_gem_ww_ctx ww;
	int err;

	i915_gem_ww_ctx_init(&ww, true);
retry:
	err = i915_gem_object_lock(obj, &ww);
	if (!err)
		err = i915_gem_object_pin_pages(obj);
	if (!err) {
		err = i915_gem_object_set_to_cpu_domain(obj, write);
		i915_gem_object_unpin_pages(obj);
	}
	if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);
	return err;
}
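
/* The inverse of begin_cpu_access: return the object to the GTT domain. */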
static int i915_gem_end_cpu_access(struct dma_buf *dma_buf, enum dma_data_direction direction)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf);
	struct i915_gem_ww_ctx ww;
	int err;

	i915_gem_ww_ctx_init(&ww, true);
retry:
	err = i915_gem_object_lock(obj, &ww);
	if (!err)
		err = i915_gem_object_pin_pages(obj);
	if (!err) {
		err = i915_gem_object_set_to_gtt_domain(obj, false);
		i915_gem_object_unpin_pages(obj);
	}
	if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);
	return err;
}
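
/*
 * Importers can only use pages in system memory, so on attach we migrate
 * the object to SMEM where possible, wait for the migration to complete
 * and keep the pages pinned for the lifetime of the attachment.
 */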
static int i915_gem_dmabuf_attach(struct dma_buf *dmabuf,
				  struct dma_buf_attachment *attach)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dmabuf);
	struct i915_gem_ww_ctx ww;
	int err;

	if (!i915_gem_object_can_migrate(obj, INTEL_REGION_SMEM))
		return -EOPNOTSUPP;

	for_i915_gem_ww(&ww, err, true) {
		err = i915_gem_object_lock(obj, &ww);
		if (err)
			continue;

		err = i915_gem_object_migrate(obj, &ww, INTEL_REGION_SMEM);
		if (err)
			continue;

		err = i915_gem_object_wait_migration(obj, 0);
		if (err)
			continue;

		err = i915_gem_object_pin_pages(obj);
	}

	return err;
}
static void i915_gem_dmabuf_detach(struct dma_buf *dmabuf,
				   struct dma_buf_attachment *attach)
{
	struct drm_i915_gem_object *obj = dma_buf_to_obj(dmabuf);

	i915_gem_object_unpin_pages(obj);
}
static const struct dma_buf_ops i915_dmabuf_ops = {
	.attach = i915_gem_dmabuf_attach,
	.detach = i915_gem_dmabuf_detach,
	.map_dma_buf = i915_gem_map_dma_buf,
	.unmap_dma_buf = i915_gem_unmap_dma_buf,
	.release = drm_gem_dmabuf_release,
	.mmap = i915_gem_dmabuf_mmap,
	.vmap = i915_gem_dmabuf_vmap,
	.vunmap = i915_gem_dmabuf_vunmap,
	.begin_cpu_access = i915_gem_begin_cpu_access,
	.end_cpu_access = i915_gem_end_cpu_access,
};
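
/*
 * These callbacks are invoked via the dma-buf core on behalf of importers.
 * Illustrative flow: userspace turns a GEM handle into an fd with
 * DRM_IOCTL_PRIME_HANDLE_TO_FD, which reaches i915_gem_prime_export()
 * below; another device imports the fd via DRM_IOCTL_PRIME_FD_TO_HANDLE,
 * attaches, and calls .map_dma_buf to obtain a DMA-mapped sg_table.
 */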
struct dma_buf *i915_gem_prime_export(struct drm_gem_object *gem_obj, int flags)
{
	struct drm_i915_gem_object *obj = to_intel_bo(gem_obj);
	DEFINE_DMA_BUF_EXPORT_INFO(exp_info);

	exp_info.ops = &i915_dmabuf_ops;
	exp_info.size = gem_obj->size;
	exp_info.flags = flags;
	exp_info.priv = gem_obj;
	exp_info.resv = obj->base.resv;

	if (obj->ops->dmabuf_export) {
		int ret = obj->ops->dmabuf_export(obj);

		if (ret)
			return ERR_PTR(ret);
	}

	return drm_gem_dmabuf_export(gem_obj->dev, &exp_info);
}
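
/*
 * get_pages for an imported object: map the attachment and adopt the
 * returned sg_table as the object's backing store. Runs with the object
 * lock held, as asserted below.
 */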
static int i915_gem_object_get_pages_dmabuf(struct drm_i915_gem_object *obj)
{
	struct drm_i915_private *i915 = to_i915(obj->base.dev);
	struct sg_table *pages;
	unsigned int sg_page_sizes;

	assert_object_held(obj);

	pages = dma_buf_map_attachment(obj->base.import_attach,
				       DMA_BIDIRECTIONAL);
	if (IS_ERR(pages))
		return PTR_ERR(pages);

	/*
	 * DG1 is special here since it still snoops transactions even with
	 * CACHE_NONE. This is not the case with other HAS_SNOOP platforms. We
	 * might need to revisit this as we add new discrete platforms.
	 *
	 * XXX: Consider doing a vmap flush or something, where possible.
	 * Currently we just do a heavy handed wbinvd_on_all_cpus() here since
	 * the underlying sg_table might not even point to struct pages, so we
	 * can't just call drm_clflush_sg or similar, like we do elsewhere in
	 * the driver.
	 */
	if (i915_gem_object_can_bypass_llc(obj) ||
	    (!HAS_LLC(i915) && !IS_DG1(i915)))
		wbinvd_on_all_cpus();

	sg_page_sizes = i915_sg_dma_sizes(pages->sgl);
	__i915_gem_object_set_pages(obj, pages, sg_page_sizes);

	return 0;
}
static void i915_gem_object_put_pages_dmabuf(struct drm_i915_gem_object *obj,
					     struct sg_table *pages)
{
	dma_buf_unmap_attachment(obj->base.import_attach, pages,
				 DMA_BIDIRECTIONAL);
}
static const struct drm_i915_gem_object_ops i915_gem_object_dmabuf_ops = {
	.name = "i915_gem_object_dmabuf",
	.get_pages = i915_gem_object_get_pages_dmabuf,
	.put_pages = i915_gem_object_put_pages_dmabuf,
};
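
/*
 * Importing one of our own dma-bufs is special-cased: rather than
 * attaching, we just take an extra reference on the underlying GEM
 * object, avoiding a round trip through the dma-buf machinery.
 */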
struct drm_gem_object *i915_gem_prime_import(struct drm_device *dev,
					     struct dma_buf *dma_buf)
{
	static struct lock_class_key lock_class;
	struct dma_buf_attachment *attach;
	struct drm_i915_gem_object *obj;
	int ret;

	/* is this one of our own objects? */
	if (dma_buf->ops == &i915_dmabuf_ops) {
		obj = dma_buf_to_obj(dma_buf);
		/* is it from our device? */
		if (obj->base.dev == dev &&
		    !I915_SELFTEST_ONLY(force_different_devices)) {
			/*
			 * Importing a dmabuf exported from our own gem
			 * increases the refcount on the gem itself instead of
			 * the f_count of the dmabuf.
			 */
			return &i915_gem_object_get(obj)->base;
		}
	}

	if (i915_gem_object_size_2big(dma_buf->size))
		return ERR_PTR(-E2BIG);

	/* need to attach */
	attach = dma_buf_attach(dma_buf, dev->dev);
	if (IS_ERR(attach))
		return ERR_CAST(attach);

	get_dma_buf(dma_buf);

	obj = i915_gem_object_alloc();
	if (obj == NULL) {
		ret = -ENOMEM;
		goto fail_detach;
	}

	drm_gem_private_object_init(dev, &obj->base, dma_buf->size);
	i915_gem_object_init(obj, &i915_gem_object_dmabuf_ops, &lock_class,
			     I915_BO_ALLOC_USER);
	obj->base.import_attach = attach;
	obj->base.resv = dma_buf->resv;

	/* We use GTT as shorthand for a coherent domain, one that is
	 * neither in the GPU cache nor in the CPU cache, where all
	 * writes are immediately visible in memory. (That's not strictly
	 * true, but it's close! There are internal buffers such as the
	 * write-combined buffer or a delay through the chipset for GTT
	 * writes that do require us to treat GTT as a separate cache domain.)
	 */
	obj->read_domains = I915_GEM_DOMAIN_GTT;
	obj->write_domain = 0;

	return &obj->base;

fail_detach:
	dma_buf_detach(dma_buf, attach);
	dma_buf_put(dma_buf);

	return ERR_PTR(ret);
}
#if IS_ENABLED(CONFIG_DRM_I915_SELFTEST)
#include "selftests/mock_dmabuf.c"
#include "selftests/i915_gem_dmabuf.c"
#endif