1 /* 2 * SPDX-License-Identifier: MIT 3 * 4 * Copyright 2012 Red Hat Inc 5 */ 6 7 #include <linux/dma-buf.h> 8 #include <linux/highmem.h> 9 #include <linux/dma-resv.h> 10 #include <linux/module.h> 11 12 #include <asm/smp.h> 13 14 #include "gem/i915_gem_dmabuf.h" 15 #include "i915_drv.h" 16 #include "i915_gem_object.h" 17 #include "i915_scatterlist.h" 18 19 MODULE_IMPORT_NS(DMA_BUF); 20 21 I915_SELFTEST_DECLARE(static bool force_different_devices;) 22 23 static struct drm_i915_gem_object *dma_buf_to_obj(struct dma_buf *buf) 24 { 25 return to_intel_bo(buf->priv); 26 } 27 28 static struct sg_table *i915_gem_map_dma_buf(struct dma_buf_attachment *attach, 29 enum dma_data_direction dir) 30 { 31 struct drm_i915_gem_object *obj = dma_buf_to_obj(attach->dmabuf); 32 struct sg_table *sgt; 33 struct scatterlist *src, *dst; 34 int ret, i; 35 36 /* 37 * Make a copy of the object's sgt, so that we can make an independent 38 * mapping 39 */ 40 sgt = kmalloc(sizeof(*sgt), GFP_KERNEL); 41 if (!sgt) { 42 ret = -ENOMEM; 43 goto err; 44 } 45 46 ret = sg_alloc_table(sgt, obj->mm.pages->orig_nents, GFP_KERNEL); 47 if (ret) 48 goto err_free; 49 50 dst = sgt->sgl; 51 for_each_sg(obj->mm.pages->sgl, src, obj->mm.pages->orig_nents, i) { 52 sg_set_page(dst, sg_page(src), src->length, 0); 53 dst = sg_next(dst); 54 } 55 56 ret = dma_map_sgtable(attach->dev, sgt, dir, DMA_ATTR_SKIP_CPU_SYNC); 57 if (ret) 58 goto err_free_sg; 59 60 return sgt; 61 62 err_free_sg: 63 sg_free_table(sgt); 64 err_free: 65 kfree(sgt); 66 err: 67 return ERR_PTR(ret); 68 } 69 70 static int i915_gem_dmabuf_vmap(struct dma_buf *dma_buf, 71 struct iosys_map *map) 72 { 73 struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf); 74 void *vaddr; 75 76 vaddr = i915_gem_object_pin_map(obj, I915_MAP_WB); 77 if (IS_ERR(vaddr)) 78 return PTR_ERR(vaddr); 79 80 iosys_map_set_vaddr(map, vaddr); 81 82 return 0; 83 } 84 85 static void i915_gem_dmabuf_vunmap(struct dma_buf *dma_buf, 86 struct iosys_map *map) 87 { 88 struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf); 89 90 i915_gem_object_flush_map(obj); 91 i915_gem_object_unpin_map(obj); 92 } 93 94 static int i915_gem_dmabuf_mmap(struct dma_buf *dma_buf, struct vm_area_struct *vma) 95 { 96 struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf); 97 struct drm_i915_private *i915 = to_i915(obj->base.dev); 98 int ret; 99 100 if (obj->base.size < vma->vm_end - vma->vm_start) 101 return -EINVAL; 102 103 if (HAS_LMEM(i915)) 104 return drm_gem_prime_mmap(&obj->base, vma); 105 106 if (!obj->base.filp) 107 return -ENODEV; 108 109 ret = call_mmap(obj->base.filp, vma); 110 if (ret) 111 return ret; 112 113 vma_set_file(vma, obj->base.filp); 114 115 return 0; 116 } 117 118 static int i915_gem_begin_cpu_access(struct dma_buf *dma_buf, enum dma_data_direction direction) 119 { 120 struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf); 121 bool write = (direction == DMA_BIDIRECTIONAL || direction == DMA_TO_DEVICE); 122 struct i915_gem_ww_ctx ww; 123 int err; 124 125 i915_gem_ww_ctx_init(&ww, true); 126 retry: 127 err = i915_gem_object_lock(obj, &ww); 128 if (!err) 129 err = i915_gem_object_pin_pages(obj); 130 if (!err) { 131 err = i915_gem_object_set_to_cpu_domain(obj, write); 132 i915_gem_object_unpin_pages(obj); 133 } 134 if (err == -EDEADLK) { 135 err = i915_gem_ww_ctx_backoff(&ww); 136 if (!err) 137 goto retry; 138 } 139 i915_gem_ww_ctx_fini(&ww); 140 return err; 141 } 142 143 static int i915_gem_end_cpu_access(struct dma_buf *dma_buf, enum dma_data_direction direction) 144 { 145 struct drm_i915_gem_object *obj = dma_buf_to_obj(dma_buf); 146 struct i915_gem_ww_ctx ww; 147 int err; 148 149 i915_gem_ww_ctx_init(&ww, true); 150 retry: 151 err = i915_gem_object_lock(obj, &ww); 152 if (!err) 153 err = i915_gem_object_pin_pages(obj); 154 if (!err) { 155 err = i915_gem_object_set_to_gtt_domain(obj, false); 156 i915_gem_object_unpin_pages(obj); 157 } 158 if (err == -EDEADLK) { 159 err = i915_gem_ww_ctx_backoff(&ww); 160 if (!err) 161 goto retry; 162 } 163 i915_gem_ww_ctx_fini(&ww); 164 return err; 165 } 166 167 static int i915_gem_dmabuf_attach(struct dma_buf *dmabuf, 168 struct dma_buf_attachment *attach) 169 { 170 struct drm_i915_gem_object *obj = dma_buf_to_obj(dmabuf); 171 struct i915_gem_ww_ctx ww; 172 int err; 173 174 if (!i915_gem_object_can_migrate(obj, INTEL_REGION_SMEM)) 175 return -EOPNOTSUPP; 176 177 for_i915_gem_ww(&ww, err, true) { 178 err = i915_gem_object_lock(obj, &ww); 179 if (err) 180 continue; 181 182 err = i915_gem_object_migrate(obj, &ww, INTEL_REGION_SMEM); 183 if (err) 184 continue; 185 186 err = i915_gem_object_wait_migration(obj, 0); 187 if (err) 188 continue; 189 190 err = i915_gem_object_pin_pages(obj); 191 } 192 193 return err; 194 } 195 196 static void i915_gem_dmabuf_detach(struct dma_buf *dmabuf, 197 struct dma_buf_attachment *attach) 198 { 199 struct drm_i915_gem_object *obj = dma_buf_to_obj(dmabuf); 200 201 i915_gem_object_unpin_pages(obj); 202 } 203 204 static const struct dma_buf_ops i915_dmabuf_ops = { 205 .attach = i915_gem_dmabuf_attach, 206 .detach = i915_gem_dmabuf_detach, 207 .map_dma_buf = i915_gem_map_dma_buf, 208 .unmap_dma_buf = drm_gem_unmap_dma_buf, 209 .release = drm_gem_dmabuf_release, 210 .mmap = i915_gem_dmabuf_mmap, 211 .vmap = i915_gem_dmabuf_vmap, 212 .vunmap = i915_gem_dmabuf_vunmap, 213 .begin_cpu_access = i915_gem_begin_cpu_access, 214 .end_cpu_access = i915_gem_end_cpu_access, 215 }; 216 217 struct dma_buf *i915_gem_prime_export(struct drm_gem_object *gem_obj, int flags) 218 { 219 struct drm_i915_gem_object *obj = to_intel_bo(gem_obj); 220 DEFINE_DMA_BUF_EXPORT_INFO(exp_info); 221 222 exp_info.ops = &i915_dmabuf_ops; 223 exp_info.size = gem_obj->size; 224 exp_info.flags = flags; 225 exp_info.priv = gem_obj; 226 exp_info.resv = obj->base.resv; 227 228 if (obj->ops->dmabuf_export) { 229 int ret = obj->ops->dmabuf_export(obj); 230 if (ret) 231 return ERR_PTR(ret); 232 } 233 234 return drm_gem_dmabuf_export(gem_obj->dev, &exp_info); 235 } 236 237 static int i915_gem_object_get_pages_dmabuf(struct drm_i915_gem_object *obj) 238 { 239 struct drm_i915_private *i915 = to_i915(obj->base.dev); 240 struct sg_table *sgt; 241 unsigned int sg_page_sizes; 242 243 assert_object_held(obj); 244 245 sgt = dma_buf_map_attachment(obj->base.import_attach, 246 DMA_BIDIRECTIONAL); 247 if (IS_ERR(sgt)) 248 return PTR_ERR(sgt); 249 250 /* 251 * DG1 is special here since it still snoops transactions even with 252 * CACHE_NONE. This is not the case with other HAS_SNOOP platforms. We 253 * might need to revisit this as we add new discrete platforms. 254 * 255 * XXX: Consider doing a vmap flush or something, where possible. 256 * Currently we just do a heavy handed wbinvd_on_all_cpus() here since 257 * the underlying sg_table might not even point to struct pages, so we 258 * can't just call drm_clflush_sg or similar, like we do elsewhere in 259 * the driver. 260 */ 261 if (i915_gem_object_can_bypass_llc(obj) || 262 (!HAS_LLC(i915) && !IS_DG1(i915))) 263 wbinvd_on_all_cpus(); 264 265 sg_page_sizes = i915_sg_dma_sizes(sgt->sgl); 266 __i915_gem_object_set_pages(obj, sgt, sg_page_sizes); 267 268 return 0; 269 } 270 271 static void i915_gem_object_put_pages_dmabuf(struct drm_i915_gem_object *obj, 272 struct sg_table *sgt) 273 { 274 dma_buf_unmap_attachment(obj->base.import_attach, sgt, 275 DMA_BIDIRECTIONAL); 276 } 277 278 static const struct drm_i915_gem_object_ops i915_gem_object_dmabuf_ops = { 279 .name = "i915_gem_object_dmabuf", 280 .get_pages = i915_gem_object_get_pages_dmabuf, 281 .put_pages = i915_gem_object_put_pages_dmabuf, 282 }; 283 284 struct drm_gem_object *i915_gem_prime_import(struct drm_device *dev, 285 struct dma_buf *dma_buf) 286 { 287 static struct lock_class_key lock_class; 288 struct dma_buf_attachment *attach; 289 struct drm_i915_gem_object *obj; 290 int ret; 291 292 /* is this one of own objects? */ 293 if (dma_buf->ops == &i915_dmabuf_ops) { 294 obj = dma_buf_to_obj(dma_buf); 295 /* is it from our device? */ 296 if (obj->base.dev == dev && 297 !I915_SELFTEST_ONLY(force_different_devices)) { 298 /* 299 * Importing dmabuf exported from out own gem increases 300 * refcount on gem itself instead of f_count of dmabuf. 301 */ 302 return &i915_gem_object_get(obj)->base; 303 } 304 } 305 306 if (i915_gem_object_size_2big(dma_buf->size)) 307 return ERR_PTR(-E2BIG); 308 309 /* need to attach */ 310 attach = dma_buf_attach(dma_buf, dev->dev); 311 if (IS_ERR(attach)) 312 return ERR_CAST(attach); 313 314 get_dma_buf(dma_buf); 315 316 obj = i915_gem_object_alloc(); 317 if (!obj) { 318 ret = -ENOMEM; 319 goto fail_detach; 320 } 321 322 drm_gem_private_object_init(dev, &obj->base, dma_buf->size); 323 i915_gem_object_init(obj, &i915_gem_object_dmabuf_ops, &lock_class, 324 I915_BO_ALLOC_USER); 325 obj->base.import_attach = attach; 326 obj->base.resv = dma_buf->resv; 327 328 /* We use GTT as shorthand for a coherent domain, one that is 329 * neither in the GPU cache nor in the CPU cache, where all 330 * writes are immediately visible in memory. (That's not strictly 331 * true, but it's close! There are internal buffers such as the 332 * write-combined buffer or a delay through the chipset for GTT 333 * writes that do require us to treat GTT as a separate cache domain.) 334 */ 335 obj->read_domains = I915_GEM_DOMAIN_GTT; 336 obj->write_domain = 0; 337 338 return &obj->base; 339 340 fail_detach: 341 dma_buf_detach(dma_buf, attach); 342 dma_buf_put(dma_buf); 343 344 return ERR_PTR(ret); 345 } 346 347 #if IS_ENABLED(CONFIG_DRM_I915_SELFTEST) 348 #include "selftests/mock_dmabuf.c" 349 #include "selftests/i915_gem_dmabuf.c" 350 #endif 351