/*
 * Copyright © 2019 Raspberry Pi
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */

#include "v3dv_private.h"
#include "drm-uapi/v3d_drm.h"

#include "broadcom/clif/clif_dump.h"

#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>

/**
 * Dumps a job's command lists to stderr through the CLIF dumper.
 *
 * Returns immediately unless V3D_DEBUG has V3D_DEBUG_CL or V3D_DEBUG_CLIF
 * set. Otherwise every BO referenced by the job is mapped and registered
 * with the dumper before the submit itself is dumped.
 *
 * @param device  Device that owns the job's BOs.
 * @param job     Job whose BO set (job->bos) is walked.
 * @param submit  Filled-in submit descriptor to dump.
 */
static void
v3dv_clif_dump(struct v3dv_device *device,
               struct v3dv_job *job,
               struct drm_v3d_submit_cl *submit)
{
   if (!(V3D_DEBUG & (V3D_DEBUG_CL | V3D_DEBUG_CLIF)))
      return;

   struct clif_dump *clif = clif_dump_init(&device->devinfo,
                                           stderr,
                                           V3D_DEBUG & V3D_DEBUG_CL);

   set_foreach(job->bos, entry) {
      struct v3dv_bo *bo = (void *)entry->key;

      /* BOs carry no name yet, so the label is just "_0x<offset>". */
      char *name = ralloc_asprintf(NULL, "%s_0x%x",
                                   "" /* bo->name */ , bo->offset);

      v3dv_bo_map(device, bo, bo->size);
      clif_dump_add_bo(clif, name, bo->offset, bo->size, bo->map);

      ralloc_free(name);
   }

   clif_dump(clif, submit);

   clif_dump_destroy(clif);
}

/**
 * Makes each semaphore in @p sems track the device's last submitted job.
 *
 * For every semaphore, any sync file fd it currently holds is closed, the
 * device's last_job_sync is exported as a sync file and that file is
 * imported into the semaphore's syncobj. The exported fd is stored in
 * sem->fd; it is closed by the next call on that semaphore or when the
 * semaphore is destroyed.
 *
 * @param device  Device whose last_job_sync is exported.
 * @param count   Number of entries in @p sems (0 is a no-op).
 * @param sems    Semaphore handles to signal.
 * @return VK_SUCCESS, or VK_ERROR_DEVICE_LOST if the export or import fails.
 */
static VkResult
process_semaphores_to_signal(struct v3dv_device *device,
                             uint32_t count, const VkSemaphore *sems)
{
   for (uint32_t i = 0; i < count; i++) {
      struct v3dv_semaphore *sem = v3dv_semaphore_from_handle(sems[i]);

      if (sem->fd >= 0)
         close(sem->fd);
      sem->fd = -1;

      /* Start from a known-invalid fd and check the call's result, so a
       * failed export is never mistaken for a valid descriptor.
       */
      int fd = -1;
      int ret = drmSyncobjExportSyncFile(device->fd,
                                         device->last_job_sync, &fd);
      if (ret || fd < 0)
         return VK_ERROR_DEVICE_LOST;

      ret = drmSyncobjImportSyncFile(device->fd, sem->sync, fd);
      if (ret) {
         /* Nobody else owns the exported fd yet; don't leak it. */
         close(fd);
         return VK_ERROR_DEVICE_LOST;
      }

      sem->fd = fd;
   }

   return VK_SUCCESS;
}

/**
 * Submits one job's binning and render command lists to the kernel.
 *
 * @param job      Job to submit; must not be NULL.
 * @param do_wait  When true, the job waits on the device's last_job_sync
 *                 before its render stage starts.
 * @return VK_SUCCESS, VK_ERROR_OUT_OF_HOST_MEMORY if the BO handle array
 *         cannot be allocated, or VK_ERROR_DEVICE_LOST if the submit ioctl
 *         fails.
 */
static VkResult
job_submit(struct v3dv_job *job, bool do_wait)
{
   assert(job);

   struct v3dv_device *device = job->cmd_buffer->device;

   /* Zero the whole descriptor so that any field not explicitly assigned
    * below reaches the kernel as 0 rather than as stack garbage.
    */
   struct drm_v3d_submit_cl submit = { 0 };

   /* RCL jobs don't start until the previous RCL job has finished so we don't
    * really need to add a fence for those, however, we might need to wait on a
    * CSD or TFU job, which are not serialized.
    *
    * FIXME: for now, if we are asked to wait on any semaphores, we just wait
    * on the last job we submitted. In the future we might want to pass the
    * actual syncobj of the wait semaphores so we don't block on the last RCL
    * if we only need to wait for a previous CSD or TFU, for example, but
    * we would have to extend our kernel interface to support the case where
    * we have more than one semaphore to wait on.
    */
   submit.in_sync_rcl = do_wait ? device->last_job_sync : 0;

   /* Update the sync object for the last rendering by this device. */
   submit.out_sync = device->last_job_sync;

   submit.bcl_start = job->bcl.bo->offset;
   submit.bcl_end = job->bcl.bo->offset + v3dv_cl_offset(&job->bcl);
   submit.rcl_start = job->rcl.bo->offset;
   submit.rcl_end = job->rcl.bo->offset + v3dv_cl_offset(&job->rcl);

   submit.flags = 0;
   /* FIXME: we already know that we support cache flush, as we only support
    * hw that supports that, but would be better to just DRM-ask it
    */
   if (job->tmu_dirty_rcl)
      submit.flags |= DRM_V3D_SUBMIT_CL_FLUSH_CACHE;

   submit.qma = job->tile_alloc->offset;
   submit.qms = job->tile_alloc->size;
   submit.qts = job->tile_state->offset;

   submit.bo_handle_count = job->bo_count;
   uint32_t *bo_handles =
      malloc(sizeof(*bo_handles) * MAX2(4, submit.bo_handle_count * 2));
   if (bo_handles == NULL)
      return VK_ERROR_OUT_OF_HOST_MEMORY;

   uint32_t bo_idx = 0;
   set_foreach(job->bos, entry) {
      struct v3dv_bo *bo = (struct v3dv_bo *)entry->key;
      bo_handles[bo_idx++] = bo->handle;
   }
   assert(bo_idx == submit.bo_handle_count);
   submit.bo_handles = (uintptr_t)(void *)bo_handles;

   v3dv_clif_dump(device, job, &submit);

   int ret = v3dv_ioctl(device->fd, DRM_IOCTL_V3D_SUBMIT_CL, &submit);

   /* Only report the first failure to avoid flooding stderr. */
   static bool warned = false;
   if (ret && !warned) {
      fprintf(stderr, "Draw call returned %s.  Expect corruption.\n",
              strerror(errno));
      warned = true;
   }

   free(bo_handles);

   if (ret)
      return VK_ERROR_DEVICE_LOST;

   return VK_SUCCESS;
}

/**
 * Processes a single VkSubmitInfo.
 *
 * Current limitations (asserted): no fence, and exactly one command buffer
 * per submit. Each job queued on the command buffer is submitted in list
 * order; after every successful job submission the signal semaphores are
 * updated to track it.
 *
 * @param queue    Queue being submitted to (currently unused).
 * @param pSubmit  Submit description.
 * @param fence    Must be a null handle for now.
 * @return VK_SUCCESS, or the first error returned by job submission or
 *         semaphore processing.
 */
static VkResult
queue_submit(struct v3dv_queue *queue,
             const VkSubmitInfo *pSubmit,
             VkFence fence)
{
   /* FIXME */
   assert(fence == 0);
   assert(pSubmit->commandBufferCount == 1);

   V3DV_FROM_HANDLE(v3dv_cmd_buffer, cmd_buffer, pSubmit->pCommandBuffers[0]);

   list_for_each_entry_safe(struct v3dv_job, job,
                            &cmd_buffer->submit_jobs, list_link) {
      VkResult result = job_submit(job, pSubmit->waitSemaphoreCount > 0);
      if (result != VK_SUCCESS)
         return result;

      result = process_semaphores_to_signal(cmd_buffer->device,
                                            pSubmit->signalSemaphoreCount,
                                            pSubmit->pSignalSemaphores);
      if (result != VK_SUCCESS)
         return result;
   }

   return VK_SUCCESS;
}

/**
 * vkQueueSubmit entry point: processes each VkSubmitInfo in order and stops
 * at the first failure.
 *
 * @return VK_SUCCESS if every submit succeeded (or submitCount is 0),
 *         otherwise the error from the first failing submit.
 */
VkResult
v3dv_QueueSubmit(VkQueue _queue,
                 uint32_t submitCount,
                 const VkSubmitInfo* pSubmits,
                 VkFence fence)
{
   V3DV_FROM_HANDLE(v3dv_queue, queue, _queue);

   VkResult result = VK_SUCCESS;
   for (uint32_t i = 0; i < submitCount; i++) {
      result = queue_submit(queue, &pSubmits[i], fence);
      if (result != VK_SUCCESS)
         break;
   }

   return result;
}

/**
 * vkCreateSemaphore entry point.
 *
 * Allocates the semaphore object and creates its DRM syncobj. The
 * semaphore starts without an associated sync file (fd == -1).
 *
 * @return VK_SUCCESS, or VK_ERROR_OUT_OF_HOST_MEMORY if either the host
 *         allocation or the syncobj creation fails.
 */
VkResult
v3dv_CreateSemaphore(VkDevice _device,
                     const VkSemaphoreCreateInfo *pCreateInfo,
                     const VkAllocationCallbacks *pAllocator,
                     VkSemaphore *pSemaphore)
{
   V3DV_FROM_HANDLE(v3dv_device, device, _device);

   assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_SEMAPHORE_CREATE_INFO);

   struct v3dv_semaphore *sem =
      vk_alloc2(&device->alloc, pAllocator, sizeof(struct v3dv_semaphore), 8,
                VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
   if (sem == NULL)
      return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);

   sem->fd = -1;

   int ret = drmSyncobjCreate(device->fd, 0, &sem->sync);
   if (ret) {
      vk_free2(&device->alloc, pAllocator, sem);
      return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
   }

   *pSemaphore = v3dv_semaphore_to_handle(sem);

   return VK_SUCCESS;
}

/**
 * vkDestroySemaphore entry point.
 *
 * Destroys the semaphore's syncobj, closes its sync file fd if it holds
 * one, and frees the object. A null handle is ignored.
 */
void
v3dv_DestroySemaphore(VkDevice _device,
                      VkSemaphore semaphore,
                      const VkAllocationCallbacks *pAllocator)
{
   V3DV_FROM_HANDLE(v3dv_device, device, _device);
   V3DV_FROM_HANDLE(v3dv_semaphore, sem, semaphore);

   if (sem == NULL)
      return;

   drmSyncobjDestroy(device->fd, sem->sync);

   if (sem->fd >= 0)
      close(sem->fd);

   vk_free2(&device->alloc, pAllocator, sem);
}