// SPDX-License-Identifier: MIT
/*
 * Copyright (C) 2015 Red Hat, Inc.
 * All Rights Reserved.
 *
 * Authors:
 *    Dave Airlie
 *    Alon Levy
 */

#include <linux/dma-fence-unwrap.h>
#include <linux/file.h>
#include <linux/sync_file.h>
#include <linux/uaccess.h>

#include <drm/drm_file.h>
#include <drm/drm_syncobj.h>
#include <drm/virtgpu_drm.h>

#include "virtgpu_drv.h"

struct virtio_gpu_submit_post_dep {
	struct drm_syncobj *syncobj;
	struct dma_fence_chain *chain;
	u64 point;
};

struct virtio_gpu_submit {
	struct virtio_gpu_submit_post_dep *post_deps;
	unsigned int num_out_syncobjs;

	struct drm_syncobj **in_syncobjs;
	unsigned int num_in_syncobjs;

	struct virtio_gpu_object_array *buflist;
	struct drm_virtgpu_execbuffer *exbuf;
	struct virtio_gpu_fence *out_fence;
	struct virtio_gpu_fpriv *vfpriv;
	struct virtio_gpu_device *vgdev;
	struct sync_file *sync_file;
	struct drm_file *file;
	int out_fence_fd;
	u64 fence_ctx;
	u32 ring_idx;
	void *buf;
};

static int virtio_gpu_do_fence_wait(struct virtio_gpu_submit *submit,
				    struct dma_fence *in_fence)
{
	u32 context = submit->fence_ctx + submit->ring_idx;

	/* Fences emitted on the same ring are ordered by the ring itself. */
	if (dma_fence_match_context(in_fence, context))
		return 0;

	return dma_fence_wait(in_fence, true);
}

static int virtio_gpu_dma_fence_wait(struct virtio_gpu_submit *submit,
				     struct dma_fence *fence)
{
	struct dma_fence_unwrap itr;
	struct dma_fence *f;
	int err;

	dma_fence_unwrap_for_each(f, &itr, fence) {
		err = virtio_gpu_do_fence_wait(submit, f);
		if (err)
			return err;
	}

	return 0;
}

static void virtio_gpu_free_syncobjs(struct drm_syncobj **syncobjs,
				     u32 nr_syncobjs)
{
	u32 i = nr_syncobjs;

	while (i--) {
		if (syncobjs[i])
			drm_syncobj_put(syncobjs[i]);
	}

	kvfree(syncobjs);
}

static int virtio_gpu_parse_deps(struct virtio_gpu_submit *submit)
{
	struct drm_virtgpu_execbuffer *exbuf = submit->exbuf;
	struct drm_virtgpu_execbuffer_syncobj syncobj_desc;
	size_t syncobj_stride = exbuf->syncobj_stride;
	u32 num_in_syncobjs = exbuf->num_in_syncobjs;
	struct drm_syncobj **syncobjs;
	int ret = 0, i;

	if (!num_in_syncobjs)
		return 0;

	/*
	 * kvcalloc() first tries to allocate memory using kmalloc() and
	 * falls back to vmalloc() only on failure. It also uses __GFP_NOWARN
	 * internally for allocations larger than a page, preventing a
	 * storm of KMSG warnings.
	 */
	syncobjs = kvcalloc(num_in_syncobjs, sizeof(*syncobjs), GFP_KERNEL);
	if (!syncobjs)
		return -ENOMEM;

	for (i = 0; i < num_in_syncobjs; i++) {
		u64 address = exbuf->in_syncobjs + i * syncobj_stride;
		struct dma_fence *fence;

		memset(&syncobj_desc, 0, sizeof(syncobj_desc));

		if (copy_from_user(&syncobj_desc,
				   u64_to_user_ptr(address),
				   min(syncobj_stride, sizeof(syncobj_desc)))) {
			ret = -EFAULT;
			break;
		}

		if (syncobj_desc.flags & ~VIRTGPU_EXECBUF_SYNCOBJ_FLAGS) {
			ret = -EINVAL;
			break;
		}

		ret = drm_syncobj_find_fence(submit->file, syncobj_desc.handle,
					     syncobj_desc.point, 0, &fence);
		if (ret)
			break;

		ret = virtio_gpu_dma_fence_wait(submit, fence);

		dma_fence_put(fence);
		if (ret)
			break;

		if (syncobj_desc.flags & VIRTGPU_EXECBUF_SYNCOBJ_RESET) {
			syncobjs[i] = drm_syncobj_find(submit->file,
						       syncobj_desc.handle);
			if (!syncobjs[i]) {
				ret = -EINVAL;
				break;
			}
		}
	}

	if (ret) {
		virtio_gpu_free_syncobjs(syncobjs, i);
		return ret;
	}

	submit->num_in_syncobjs = num_in_syncobjs;
	submit->in_syncobjs = syncobjs;

	return ret;
}

static void virtio_gpu_reset_syncobjs(struct drm_syncobj **syncobjs,
				      u32 nr_syncobjs)
{
	u32 i;

	for (i = 0; i < nr_syncobjs; i++) {
		if (syncobjs[i])
			drm_syncobj_replace_fence(syncobjs[i], NULL);
	}
}

static void
virtio_gpu_free_post_deps(struct virtio_gpu_submit_post_dep *post_deps,
			  u32 nr_syncobjs)
{
	u32 i = nr_syncobjs;

	while (i--) {
		kfree(post_deps[i].chain);
		drm_syncobj_put(post_deps[i].syncobj);
	}

	kvfree(post_deps);
}

static int virtio_gpu_parse_post_deps(struct virtio_gpu_submit *submit)
{
	struct drm_virtgpu_execbuffer *exbuf = submit->exbuf;
	struct drm_virtgpu_execbuffer_syncobj syncobj_desc;
	struct virtio_gpu_submit_post_dep *post_deps;
	u32 num_out_syncobjs = exbuf->num_out_syncobjs;
	size_t syncobj_stride = exbuf->syncobj_stride;
	int ret = 0, i;

	if (!num_out_syncobjs)
		return 0;

	post_deps = kvcalloc(num_out_syncobjs, sizeof(*post_deps), GFP_KERNEL);
	if (!post_deps)
		return -ENOMEM;

	for (i = 0; i < num_out_syncobjs; i++) {
		u64 address = exbuf->out_syncobjs + i * syncobj_stride;

		memset(&syncobj_desc, 0, sizeof(syncobj_desc));

		if (copy_from_user(&syncobj_desc,
				   u64_to_user_ptr(address),
				   min(syncobj_stride, sizeof(syncobj_desc)))) {
			ret = -EFAULT;
			break;
		}

		post_deps[i].point = syncobj_desc.point;

		if (syncobj_desc.flags) {
			ret = -EINVAL;
			break;
		}

		if (syncobj_desc.point) {
			post_deps[i].chain = dma_fence_chain_alloc();
			if (!post_deps[i].chain) {
				ret = -ENOMEM;
				break;
			}
		}

		post_deps[i].syncobj = drm_syncobj_find(submit->file,
							syncobj_desc.handle);
		if (!post_deps[i].syncobj) {
			kfree(post_deps[i].chain);
			ret = -EINVAL;
			break;
		}
	}

	if (ret) {
		virtio_gpu_free_post_deps(post_deps, i);
		return ret;
	}

	submit->num_out_syncobjs = num_out_syncobjs;
	submit->post_deps = post_deps;

	return 0;
}

static void virtio_gpu_process_post_deps(struct virtio_gpu_submit *submit)
{
	struct virtio_gpu_submit_post_dep *post_deps = submit->post_deps;

	if (post_deps) {
		struct dma_fence *fence = &submit->out_fence->f;
		u32 i;

		for (i = 0; i < submit->num_out_syncobjs; i++) {
			if (post_deps[i].chain) {
				drm_syncobj_add_point(post_deps[i].syncobj,
						      post_deps[i].chain,
						      fence, post_deps[i].point);
				post_deps[i].chain = NULL;
			} else {
				drm_syncobj_replace_fence(post_deps[i].syncobj,
							  fence);
			}
		}
	}
}

static int virtio_gpu_fence_event_create(struct drm_device *dev,
					 struct drm_file *file,
					 struct virtio_gpu_fence *fence,
					 u32 ring_idx)
{
	struct virtio_gpu_fence_event *e = NULL;
	int ret;

	e = kzalloc(sizeof(*e), GFP_KERNEL);
	if (!e)
		return -ENOMEM;

	e->event.type = VIRTGPU_EVENT_FENCE_SIGNALED;
	e->event.length = sizeof(e->event);

	ret = drm_event_reserve_init(dev, file, &e->base, &e->event);
	if (ret) {
		kfree(e);
		return ret;
	}

	fence->e = e;

	return 0;
}

static int virtio_gpu_init_submit_buflist(struct virtio_gpu_submit *submit)
{
	struct drm_virtgpu_execbuffer *exbuf = submit->exbuf;
	u32 *bo_handles;

	if (!exbuf->num_bo_handles)
		return 0;

	bo_handles = kvmalloc_array(exbuf->num_bo_handles, sizeof(*bo_handles),
				    GFP_KERNEL);
	if (!bo_handles)
		return -ENOMEM;

	if (copy_from_user(bo_handles, u64_to_user_ptr(exbuf->bo_handles),
			   exbuf->num_bo_handles * sizeof(*bo_handles))) {
		kvfree(bo_handles);
		return -EFAULT;
	}

	submit->buflist = virtio_gpu_array_from_handles(submit->file, bo_handles,
							exbuf->num_bo_handles);
	if (!submit->buflist) {
		kvfree(bo_handles);
		return -ENOENT;
	}

	kvfree(bo_handles);

	return 0;
}

static void virtio_gpu_cleanup_submit(struct virtio_gpu_submit *submit)
{
	virtio_gpu_reset_syncobjs(submit->in_syncobjs, submit->num_in_syncobjs);
	virtio_gpu_free_syncobjs(submit->in_syncobjs, submit->num_in_syncobjs);
	virtio_gpu_free_post_deps(submit->post_deps, submit->num_out_syncobjs);

	if (!IS_ERR(submit->buf))
		kvfree(submit->buf);

	if (submit->buflist)
		virtio_gpu_array_put_free(submit->buflist);

	if (submit->out_fence_fd >= 0)
		put_unused_fd(submit->out_fence_fd);

	if (submit->out_fence)
		dma_fence_put(&submit->out_fence->f);

	if (submit->sync_file)
		fput(submit->sync_file->file);
}

static void virtio_gpu_submit(struct virtio_gpu_submit *submit)
{
	virtio_gpu_cmd_submit(submit->vgdev, submit->buf, submit->exbuf->size,
			      submit->vfpriv->ctx_id, submit->buflist,
			      submit->out_fence);
	virtio_gpu_notify(submit->vgdev);
}

static void virtio_gpu_complete_submit(struct virtio_gpu_submit *submit)
{
	/*
	 * Ownership of the command buffer, the buffer list, the sync-file and
	 * the reserved fd has been handed over, so virtio_gpu_cleanup_submit()
	 * must not release them.
	 */
	submit->buf = NULL;
	submit->buflist = NULL;
	submit->sync_file = NULL;
	submit->out_fence_fd = -1;
}

static int virtio_gpu_init_submit(struct virtio_gpu_submit *submit,
				  struct drm_virtgpu_execbuffer *exbuf,
				  struct drm_device *dev,
				  struct drm_file *file,
				  u64 fence_ctx, u32 ring_idx)
{
	struct virtio_gpu_fpriv *vfpriv = file->driver_priv;
	struct virtio_gpu_device *vgdev = dev->dev_private;
	struct virtio_gpu_fence *out_fence;
	bool drm_fence_event;
	int err;

	memset(submit, 0, sizeof(*submit));

	if ((exbuf->flags & VIRTGPU_EXECBUF_RING_IDX) &&
	    (vfpriv->ring_idx_mask & BIT_ULL(ring_idx)))
		drm_fence_event = true;
	else
		drm_fence_event = false;

	if ((exbuf->flags & VIRTGPU_EXECBUF_FENCE_FD_OUT) ||
	    exbuf->num_out_syncobjs ||
	    exbuf->num_bo_handles ||
	    drm_fence_event)
		out_fence = virtio_gpu_fence_alloc(vgdev, fence_ctx, ring_idx);
	else
		out_fence = NULL;

	if (drm_fence_event) {
		err = virtio_gpu_fence_event_create(dev, file, out_fence,
						    ring_idx);
		if (err) {
			dma_fence_put(&out_fence->f);
			return err;
		}
	}

	submit->out_fence = out_fence;
	submit->fence_ctx = fence_ctx;
	submit->ring_idx = ring_idx;
	submit->out_fence_fd = -1;
	submit->vfpriv = vfpriv;
	submit->vgdev = vgdev;
	submit->exbuf = exbuf;
	submit->file = file;

	err = virtio_gpu_init_submit_buflist(submit);
	if (err)
		return err;

	submit->buf = vmemdup_user(u64_to_user_ptr(exbuf->command), exbuf->size);
	if (IS_ERR(submit->buf))
		return PTR_ERR(submit->buf);

	if (exbuf->flags & VIRTGPU_EXECBUF_FENCE_FD_OUT) {
		err = get_unused_fd_flags(O_CLOEXEC);
		if (err < 0)
			return err;

		submit->out_fence_fd = err;

		submit->sync_file = sync_file_create(&out_fence->f);
		if (!submit->sync_file)
			return -ENOMEM;
	}

	return 0;
}

static int virtio_gpu_wait_in_fence(struct virtio_gpu_submit *submit)
{
	int ret = 0;

	if (submit->exbuf->flags & VIRTGPU_EXECBUF_FENCE_FD_IN) {
		struct dma_fence *in_fence =
				sync_file_get_fence(submit->exbuf->fence_fd);
		if (!in_fence)
			return -EINVAL;
		/*
		 * Wait if the fence is from a foreign context, or if the
		 * fence array contains any fence from a foreign context.
		 */
		ret = virtio_gpu_dma_fence_wait(submit, in_fence);

		dma_fence_put(in_fence);
	}

	return ret;
}

static void virtio_gpu_install_out_fence_fd(struct virtio_gpu_submit *submit)
{
	if (submit->sync_file) {
		submit->exbuf->fence_fd = submit->out_fence_fd;
		fd_install(submit->out_fence_fd, submit->sync_file->file);
	}
}

static int virtio_gpu_lock_buflist(struct virtio_gpu_submit *submit)
{
	if (submit->buflist)
		return virtio_gpu_array_lock_resv(submit->buflist);

	return 0;
}

int virtio_gpu_execbuffer_ioctl(struct drm_device *dev, void *data,
				struct drm_file *file)
{
	struct virtio_gpu_device *vgdev = dev->dev_private;
	struct virtio_gpu_fpriv *vfpriv = file->driver_priv;
	u64 fence_ctx = vgdev->fence_drv.context;
	struct drm_virtgpu_execbuffer *exbuf = data;
	struct virtio_gpu_submit submit;
	u32 ring_idx = 0;
	int ret = -EINVAL;

	if (!vgdev->has_virgl_3d)
		return -ENOSYS;

	if (exbuf->flags & ~VIRTGPU_EXECBUF_FLAGS)
		return ret;

	if (exbuf->flags & VIRTGPU_EXECBUF_RING_IDX) {
		if (exbuf->ring_idx >= vfpriv->num_rings)
			return ret;

		if (!vfpriv->base_fence_ctx)
			return ret;

		fence_ctx = vfpriv->base_fence_ctx;
		ring_idx = exbuf->ring_idx;
	}

	virtio_gpu_create_context(dev, file);

	ret = virtio_gpu_init_submit(&submit, exbuf, dev, file,
				     fence_ctx, ring_idx);
	if (ret)
		goto cleanup;

	ret = virtio_gpu_parse_post_deps(&submit);
	if (ret)
		goto cleanup;

	ret = virtio_gpu_parse_deps(&submit);
	if (ret)
		goto cleanup;

	/*
	 * Await in-fences at the end of the job-submission path so that,
	 * once the waits complete, we proceed directly to the submission
	 * to virtio.
	 */
	ret = virtio_gpu_wait_in_fence(&submit);
	if (ret)
		goto cleanup;

	ret = virtio_gpu_lock_buflist(&submit);
	if (ret)
		goto cleanup;

	virtio_gpu_submit(&submit);

	/*
	 * Set up the user-visible output data after submitting the job to
	 * keep the submission path short.
	 */
	virtio_gpu_install_out_fence_fd(&submit);
	virtio_gpu_process_post_deps(&submit);
	virtio_gpu_complete_submit(&submit);

cleanup:
	virtio_gpu_cleanup_submit(&submit);

	return ret;
}