| /* |
| * © Copyright 2019 Collabora, Ltd. |
| * Copyright 2019 Alyssa Rosenzweig |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a |
| * copy of this software and associated documentation files (the "Software"), |
| * to deal in the Software without restriction, including without limitation |
| * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| * and/or sell copies of the Software, and to permit persons to whom the |
| * Software is furnished to do so, subject to the following conditions: |
| * |
| * The above copyright notice and this permission notice (including the next |
| * paragraph) shall be included in all copies or substantial portions of the |
| * Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
| * SOFTWARE. |
| * |
| */ |
| |
| #include <fcntl.h> |
| #include <xf86drm.h> |
| |
| #include "drm-uapi/panfrost_drm.h" |
| |
| #include "util/u_memory.h" |
| #include "util/os_time.h" |
| #include "os/os_mman.h" |
| |
| #include "pan_screen.h" |
| #include "pan_resource.h" |
| #include "pan_context.h" |
| #include "pan_util.h" |
| #include "pandecode/decode.h" |
| |
| void |
| panfrost_drm_mmap_bo(struct panfrost_screen *screen, struct panfrost_bo *bo) |
| { |
| struct drm_panfrost_mmap_bo mmap_bo = { .handle = bo->gem_handle }; |
| int ret; |
| |
| if (bo->cpu) |
| return; |
| |
| ret = drmIoctl(screen->fd, DRM_IOCTL_PANFROST_MMAP_BO, &mmap_bo); |
| if (ret) { |
| fprintf(stderr, "DRM_IOCTL_PANFROST_MMAP_BO failed: %m\n"); |
| assert(0); |
| } |
| |
| bo->cpu = os_mmap(NULL, bo->size, PROT_READ | PROT_WRITE, MAP_SHARED, |
| screen->fd, mmap_bo.offset); |
| if (bo->cpu == MAP_FAILED) { |
| fprintf(stderr, "mmap failed: %p %m\n", bo->cpu); |
| assert(0); |
| } |
| |
| /* Record the mmap if we're tracing */ |
| if (pan_debug & PAN_DBG_TRACE) |
| pandecode_inject_mmap(bo->gpu, bo->cpu, bo->size, NULL); |
| } |
| |
| static void |
| panfrost_drm_munmap_bo(struct panfrost_screen *screen, struct panfrost_bo *bo) |
| { |
| if (!bo->cpu) |
| return; |
| |
| if (os_munmap((void *) (uintptr_t)bo->cpu, bo->size)) { |
| perror("munmap"); |
| abort(); |
| } |
| |
| bo->cpu = NULL; |
| } |
| |
| struct panfrost_bo * |
| panfrost_drm_create_bo(struct panfrost_screen *screen, size_t size, |
| uint32_t flags) |
| { |
| struct panfrost_bo *bo; |
| |
| /* Kernel will fail (confusingly) with EPERM otherwise */ |
| assert(size > 0); |
| |
| /* To maximize BO cache usage, don't allocate tiny BOs */ |
| size = MAX2(size, 4096); |
| |
| /* GROWABLE BOs cannot be mmapped */ |
| if (flags & PAN_ALLOCATE_GROWABLE) |
| assert(flags & PAN_ALLOCATE_INVISIBLE); |
| |
| unsigned translated_flags = 0; |
| |
| if (screen->kernel_version->version_major > 1 || |
| screen->kernel_version->version_minor >= 1) { |
| if (flags & PAN_ALLOCATE_GROWABLE) |
| translated_flags |= PANFROST_BO_HEAP; |
| if (!(flags & PAN_ALLOCATE_EXECUTE)) |
| translated_flags |= PANFROST_BO_NOEXEC; |
| } |
| |
| struct drm_panfrost_create_bo create_bo = { |
| .size = size, |
| .flags = translated_flags, |
| }; |
| |
| /* Before creating a BO, we first want to check the cache */ |
| |
| bo = panfrost_bo_cache_fetch(screen, size, flags); |
| |
| if (bo == NULL) { |
| /* Otherwise, the cache misses and we need to allocate a BO fresh from |
| * the kernel */ |
| |
| int ret; |
| |
| ret = drmIoctl(screen->fd, DRM_IOCTL_PANFROST_CREATE_BO, &create_bo); |
| if (ret) { |
| fprintf(stderr, "DRM_IOCTL_PANFROST_CREATE_BO failed: %m\n"); |
| assert(0); |
| } |
| |
| /* We have a BO allocated from the kernel; fill in the userspace |
| * version */ |
| |
| bo = rzalloc(screen, struct panfrost_bo); |
| bo->size = create_bo.size; |
| bo->gpu = create_bo.offset; |
| bo->gem_handle = create_bo.handle; |
| bo->flags = flags; |
| } |
| |
| /* Only mmap now if we know we need to. For CPU-invisible buffers, we |
| * never map since we don't care about their contents; they're purely |
| * for GPU-internal use. But we do trace them anyway. */ |
| |
| if (!(flags & (PAN_ALLOCATE_INVISIBLE | PAN_ALLOCATE_DELAY_MMAP))) |
| panfrost_drm_mmap_bo(screen, bo); |
| else if (flags & PAN_ALLOCATE_INVISIBLE) { |
| if (pan_debug & PAN_DBG_TRACE) |
| pandecode_inject_mmap(bo->gpu, NULL, bo->size, NULL); |
| } |
| |
| pipe_reference_init(&bo->reference, 1); |
| return bo; |
| } |
| |
| void |
| panfrost_drm_release_bo(struct panfrost_screen *screen, struct panfrost_bo *bo, bool cacheable) |
| { |
| if (!bo) |
| return; |
| |
| struct drm_gem_close gem_close = { .handle = bo->gem_handle }; |
| int ret; |
| |
| /* Rather than freeing the BO now, we'll cache the BO for later |
| * allocations if we're allowed to */ |
| |
| panfrost_drm_munmap_bo(screen, bo); |
| |
| if (cacheable) { |
| bool cached = panfrost_bo_cache_put(screen, bo); |
| |
| if (cached) |
| return; |
| } |
| |
| /* Otherwise, if the BO wasn't cached, we'll legitimately free the BO */ |
| |
| ret = drmIoctl(screen->fd, DRM_IOCTL_GEM_CLOSE, &gem_close); |
| if (ret) { |
| fprintf(stderr, "DRM_IOCTL_GEM_CLOSE failed: %m\n"); |
| assert(0); |
| } |
| |
| ralloc_free(bo); |
| } |
| |
| void |
| panfrost_drm_allocate_slab(struct panfrost_screen *screen, |
| struct panfrost_memory *mem, |
| size_t pages, |
| bool same_va, |
| int extra_flags, |
| int commit_count, |
| int extent) |
| { |
| // TODO cache allocations |
| // TODO properly handle errors |
| // TODO take into account extra_flags |
| mem->bo = panfrost_drm_create_bo(screen, pages * 4096, extra_flags); |
| mem->stack_bottom = 0; |
| } |
| |
| void |
| panfrost_drm_free_slab(struct panfrost_screen *screen, struct panfrost_memory *mem) |
| { |
| panfrost_bo_unreference(&screen->base, mem->bo); |
| mem->bo = NULL; |
| } |
| |
| struct panfrost_bo * |
| panfrost_drm_import_bo(struct panfrost_screen *screen, int fd) |
| { |
| struct panfrost_bo *bo = rzalloc(screen, struct panfrost_bo); |
| struct drm_panfrost_get_bo_offset get_bo_offset = {0,}; |
| ASSERTED int ret; |
| unsigned gem_handle; |
| |
| ret = drmPrimeFDToHandle(screen->fd, fd, &gem_handle); |
| assert(!ret); |
| |
| get_bo_offset.handle = gem_handle; |
| ret = drmIoctl(screen->fd, DRM_IOCTL_PANFROST_GET_BO_OFFSET, &get_bo_offset); |
| assert(!ret); |
| |
| bo->gem_handle = gem_handle; |
| bo->gpu = (mali_ptr) get_bo_offset.offset; |
| bo->size = lseek(fd, 0, SEEK_END); |
| assert(bo->size > 0); |
| pipe_reference_init(&bo->reference, 1); |
| |
| // TODO map and unmap on demand? |
| panfrost_drm_mmap_bo(screen, bo); |
| return bo; |
| } |
| |
| int |
| panfrost_drm_export_bo(struct panfrost_screen *screen, const struct panfrost_bo *bo) |
| { |
| struct drm_prime_handle args = { |
| .handle = bo->gem_handle, |
| .flags = DRM_CLOEXEC, |
| }; |
| |
| int ret = drmIoctl(screen->fd, DRM_IOCTL_PRIME_HANDLE_TO_FD, &args); |
| if (ret == -1) |
| return -1; |
| |
| return args.fd; |
| } |
| |
| static int |
| panfrost_drm_submit_job(struct panfrost_context *ctx, u64 job_desc, int reqs) |
| { |
| struct pipe_context *gallium = (struct pipe_context *) ctx; |
| struct panfrost_screen *screen = pan_screen(gallium->screen); |
| struct panfrost_job *job = panfrost_get_job_for_fbo(ctx); |
| struct drm_panfrost_submit submit = {0,}; |
| int *bo_handles, ret; |
| |
| submit.in_syncs = (u64) (uintptr_t) &ctx->out_sync; |
| submit.in_sync_count = 1; |
| |
| submit.out_sync = ctx->out_sync; |
| |
| submit.jc = job_desc; |
| submit.requirements = reqs; |
| |
| bo_handles = calloc(job->bos->entries, sizeof(*bo_handles)); |
| assert(bo_handles); |
| |
| set_foreach(job->bos, entry) { |
| struct panfrost_bo *bo = (struct panfrost_bo *)entry->key; |
| assert(bo->gem_handle > 0); |
| bo_handles[submit.bo_handle_count++] = bo->gem_handle; |
| } |
| |
| submit.bo_handles = (u64) (uintptr_t) bo_handles; |
| ret = drmIoctl(screen->fd, DRM_IOCTL_PANFROST_SUBMIT, &submit); |
| free(bo_handles); |
| if (ret) { |
| fprintf(stderr, "Error submitting: %m\n"); |
| return errno; |
| } |
| |
| /* Trace the job if we're doing that */ |
| if (pan_debug & PAN_DBG_TRACE) { |
| /* Wait so we can get errors reported back */ |
| drmSyncobjWait(screen->fd, &ctx->out_sync, 1, INT64_MAX, 0, NULL); |
| pandecode_jc(submit.jc, FALSE); |
| } |
| |
| return 0; |
| } |
| |
| int |
| panfrost_drm_submit_vs_fs_job(struct panfrost_context *ctx, bool has_draws, bool is_scanout) |
| { |
| int ret = 0; |
| |
| struct panfrost_job *job = panfrost_get_job_for_fbo(ctx); |
| |
| /* TODO: Add here the transient pools */ |
| panfrost_job_add_bo(job, ctx->scratchpad.bo); |
| panfrost_job_add_bo(job, ctx->tiler_heap.bo); |
| panfrost_job_add_bo(job, job->polygon_list); |
| |
| if (job->first_job.gpu) { |
| ret = panfrost_drm_submit_job(ctx, job->first_job.gpu, 0); |
| assert(!ret); |
| } |
| |
| if (job->first_tiler.gpu || job->clear) { |
| ret = panfrost_drm_submit_job(ctx, panfrost_fragment_job(ctx, has_draws), PANFROST_JD_REQ_FS); |
| assert(!ret); |
| } |
| |
| return ret; |
| } |
| |
| static struct panfrost_fence * |
| panfrost_fence_create(struct panfrost_context *ctx) |
| { |
| struct pipe_context *gallium = (struct pipe_context *) ctx; |
| struct panfrost_screen *screen = pan_screen(gallium->screen); |
| struct panfrost_fence *f = calloc(1, sizeof(*f)); |
| if (!f) |
| return NULL; |
| |
| /* Snapshot the last Panfrost's rendering's out fence. We'd rather have |
| * another syncobj instead of a sync file, but this is all we get. |
| * (HandleToFD/FDToHandle just gives you another syncobj ID for the |
| * same syncobj). |
| */ |
| drmSyncobjExportSyncFile(screen->fd, ctx->out_sync, &f->fd); |
| if (f->fd == -1) { |
| fprintf(stderr, "export failed: %m\n"); |
| free(f); |
| return NULL; |
| } |
| |
| pipe_reference_init(&f->reference, 1); |
| |
| return f; |
| } |
| |
| void |
| panfrost_drm_force_flush_fragment(struct panfrost_context *ctx, |
| struct pipe_fence_handle **fence) |
| { |
| struct pipe_context *gallium = (struct pipe_context *) ctx; |
| struct panfrost_screen *screen = pan_screen(gallium->screen); |
| |
| if (!screen->last_fragment_flushed) { |
| drmSyncobjWait(screen->fd, &ctx->out_sync, 1, INT64_MAX, 0, NULL); |
| screen->last_fragment_flushed = true; |
| |
| /* The job finished up, so we're safe to clean it up now */ |
| panfrost_free_job(ctx, screen->last_job); |
| } |
| |
| if (fence) { |
| struct panfrost_fence *f = panfrost_fence_create(ctx); |
| gallium->screen->fence_reference(gallium->screen, fence, NULL); |
| *fence = (struct pipe_fence_handle *)f; |
| } |
| } |
| |
| unsigned |
| panfrost_drm_query_gpu_version(struct panfrost_screen *screen) |
| { |
| struct drm_panfrost_get_param get_param = {0,}; |
| ASSERTED int ret; |
| |
| get_param.param = DRM_PANFROST_PARAM_GPU_PROD_ID; |
| ret = drmIoctl(screen->fd, DRM_IOCTL_PANFROST_GET_PARAM, &get_param); |
| assert(!ret); |
| |
| return get_param.value; |
| } |
| |
| int |
| panfrost_drm_init_context(struct panfrost_context *ctx) |
| { |
| struct pipe_context *gallium = (struct pipe_context *) ctx; |
| struct panfrost_screen *screen = pan_screen(gallium->screen); |
| |
| return drmSyncobjCreate(screen->fd, DRM_SYNCOBJ_CREATE_SIGNALED, |
| &ctx->out_sync); |
| } |
| |
| void |
| panfrost_drm_fence_reference(struct pipe_screen *screen, |
| struct pipe_fence_handle **ptr, |
| struct pipe_fence_handle *fence) |
| { |
| struct panfrost_fence **p = (struct panfrost_fence **)ptr; |
| struct panfrost_fence *f = (struct panfrost_fence *)fence; |
| struct panfrost_fence *old = *p; |
| |
| if (pipe_reference(&(*p)->reference, &f->reference)) { |
| close(old->fd); |
| free(old); |
| } |
| *p = f; |
| } |
| |
| boolean |
| panfrost_drm_fence_finish(struct pipe_screen *pscreen, |
| struct pipe_context *ctx, |
| struct pipe_fence_handle *fence, |
| uint64_t timeout) |
| { |
| struct panfrost_screen *screen = pan_screen(pscreen); |
| struct panfrost_fence *f = (struct panfrost_fence *)fence; |
| int ret; |
| |
| unsigned syncobj; |
| ret = drmSyncobjCreate(screen->fd, 0, &syncobj); |
| if (ret) { |
| fprintf(stderr, "Failed to create syncobj to wait on: %m\n"); |
| return false; |
| } |
| |
| ret = drmSyncobjImportSyncFile(screen->fd, syncobj, f->fd); |
| if (ret) { |
| fprintf(stderr, "Failed to import fence to syncobj: %m\n"); |
| return false; |
| } |
| |
| uint64_t abs_timeout = os_time_get_absolute_timeout(timeout); |
| if (abs_timeout == OS_TIMEOUT_INFINITE) |
| abs_timeout = INT64_MAX; |
| |
| ret = drmSyncobjWait(screen->fd, &syncobj, 1, abs_timeout, 0, NULL); |
| |
| drmSyncobjDestroy(screen->fd, syncobj); |
| |
| return ret >= 0; |
| } |