/*
 * Copyright (C) 2017 Rob Clark
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *    Rob Clark
 */

#include "util/u_inlines.h"
#include "util/u_memory.h"

#include "freedreno_context.h"
#include "freedreno_query_acc.h"
#include "freedreno_resource.h"
#include "freedreno_util.h"

/* ->destroy_query() hook: drops the query's buffer reference, unlinks the
 * query from whatever list its node is on, and frees the query together with
 * its query_data.
 */
static void
fd_acc_destroy_query(struct fd_context *ctx, struct fd_query *q) assert_dt
{
   struct fd_acc_query *acc = fd_acc_query(q);

   DBG("%p", q);

   pipe_resource_reference(&acc->prsc, NULL);
   list_del(&acc->node);

   free(acc->query_data);
   free(acc);
}

/* Replace the query's result buffer with a newly created one and clear the
 * first aq->size bytes of it from the CPU.
 */
static void
realloc_query_bo(struct fd_context *ctx, struct fd_acc_query *aq)
{
   /* let go of the buffer used by any previous begin/end cycle: */
   pipe_resource_reference(&aq->prsc, NULL);

   aq->prsc =
      pipe_buffer_create(&ctx->screen->base, PIPE_BIND_QUERY_BUFFER, 0, 0x1000);

   /* don't assume the buffer is zero-initialized: */
   struct fd_resource *rsc = fd_resource(aq->prsc);

   fd_bo_cpu_prep(rsc->bo, ctx->pipe, FD_BO_PREP_WRITE);
   memset(fd_bo_map(rsc->bo), 0, aq->size);
   fd_bo_cpu_fini(rsc->bo);
}

/* Stop sampling in the batch the query is currently attached to.  A query
 * that is not attached to any batch is left untouched.
 */
static void
fd_acc_query_pause(struct fd_acc_query *aq) assert_dt
{
   const struct fd_acc_sample_provider *provider = aq->provider;
   struct fd_batch *batch = aq->batch;

   if (!batch)
      return;

   fd_batch_needs_flush(batch);
   provider->pause(aq, batch);

   /* the query is no longer attached to a batch: */
   aq->batch = NULL;
}

/* Attach the query to 'batch' and start sampling there, then (under the
 * screen lock) record that the batch writes the query's result buffer.
 */
static void
fd_acc_query_resume(struct fd_acc_query *aq, struct fd_batch *batch) assert_dt
{
   const struct fd_acc_sample_provider *provider = aq->provider;

   aq->batch = batch;

   fd_batch_needs_flush(batch);
   provider->resume(aq, batch);

   fd_screen_lock(batch->ctx->screen);
   fd_batch_resource_write(batch, fd_resource(aq->prsc));
   fd_screen_unlock(batch->ctx->screen);
}

/* ->begin_query() hook: gives the query a fresh, cleared result buffer and
 * puts it on the context's list of active accumulated queries.
 */
static void
fd_acc_begin_query(struct fd_context *ctx, struct fd_query *q) assert_dt
{
   struct fd_acc_query *aq = fd_acc_query(q);

   DBG("%p", q);

   /* ->begin_query() discards previous results, so realloc bo: */
   realloc_query_bo(ctx, aq);

   /* Signal that we need to update the active queries on the next draw */
   ctx->update_active_queries = true;

   /* add to active list: */
   assert(list_is_empty(&aq->node));
   list_addtail(&aq->node, &ctx->acc_active_queries);

   /* Query types for which skip_begin_query() is true (TIMESTAMP and
    * GPU_FINISHED) are not bracketed at draw time, so the capture has to be
    * emitted right now instead.
    */
   if (!skip_begin_query(q->type))
      return;

   struct fd_batch *batch = fd_context_batch_locked(ctx);

   fd_acc_query_resume(aq, batch);
   fd_batch_unlock_submit(batch);
   fd_batch_reference(&batch, NULL);
}

/* ->end_query() hook: pauses the query and takes it off the active list. */
static void
fd_acc_end_query(struct fd_context *ctx, struct fd_query *q) assert_dt
{
   struct fd_acc_query *acc = fd_acc_query(q);

   DBG("%p", q);

   fd_acc_query_pause(acc);

   /* remove from active list: */
   list_delinit(&acc->node);
}

/* ->get_query_result() hook.
 *
 * Waits for the query's result buffer to become readable, then lets the
 * sample provider convert the buffer contents into 'result'.
 *
 * Returns false only when 'wait' is false and the non-blocking wait on the
 * buffer reports a non-zero status; returns true otherwise.
 */
static bool
fd_acc_get_query_result(struct fd_context *ctx, struct fd_query *q, bool wait,
                        union pipe_query_result *result)
{
   struct fd_acc_query *aq = fd_acc_query(q);
   const struct fd_acc_sample_provider *provider = aq->provider;
   struct fd_resource *rsc = fd_resource(aq->prsc);

   DBG("%p: wait=%d", q, wait);

   assert(list_is_empty(&aq->node));

   /* ARB_occlusion_query says:
    *
    *     "Querying the state for a given occlusion query forces that
    *      occlusion query to complete within a finite amount of time."
    *
    * So, regardless of whether we are supposed to wait or not, we do need to
    * flush now.
    */
   if (fd_get_query_result_in_driver_thread(q)) {
      tc_assert_driver_thread(ctx->tc);
      fd_context_access_begin(ctx);
      fd_bc_flush_writer(ctx, rsc);
      fd_context_access_end(ctx);
   }

   if (wait) {
      fd_resource_wait(ctx, rsc, FD_BO_PREP_READ);
   } else {
      int status = fd_resource_wait(
         ctx, rsc, FD_BO_PREP_READ | FD_BO_PREP_NOSYNC | FD_BO_PREP_FLUSH);

      /* result not available yet and the caller asked us not to block: */
      if (status)
         return false;
   }

   void *samples = fd_bo_map(rsc->bo);

   provider->result(aq, samples, result);
   fd_bo_cpu_fini(rsc->bo);

   return true;
}

/* Query vtable installed on every query made by fd_acc_create_query2(). */
static const struct fd_query_funcs acc_query_funcs = {
   .destroy_query = fd_acc_destroy_query,
   .begin_query = fd_acc_begin_query,
   .end_query = fd_acc_end_query,
   .get_query_result = fd_acc_get_query_result,
};

/* Allocate an accumulated query backed by an explicitly supplied sample
 * provider.
 *
 * Returns the embedded base query, or NULL if the allocation fails.  No
 * result buffer is created here; that happens in ->begin_query().
 */
struct fd_query *
fd_acc_create_query2(struct fd_context *ctx, unsigned query_type,
                     unsigned index,
                     const struct fd_acc_sample_provider *provider)
{
   struct fd_acc_query *acc = CALLOC_STRUCT(fd_acc_query);

   if (!acc)
      return NULL;

   DBG("%p: query_type=%u", acc, query_type);

   acc->provider = provider;
   acc->size = provider->size;

   list_inithead(&acc->node);

   acc->base.funcs = &acc_query_funcs;
   acc->base.type = query_type;
   acc->base.index = index;

   return &acc->base;
}

/* Allocate an accumulated query using the provider registered on the context
 * for 'query_type'.
 *
 * Returns NULL when pidx() yields a negative index for the query type, or
 * when no provider is registered in that slot.
 */
struct fd_query *
fd_acc_create_query(struct fd_context *ctx, unsigned query_type,
                    unsigned index)
{
   int idx = pidx(query_type);

   if (idx < 0)
      return NULL;

   const struct fd_acc_sample_provider *provider =
      ctx->acc_sample_providers[idx];

   if (!provider)
      return NULL;

   return fd_acc_create_query2(ctx, query_type, index, provider);
}

/* Called at clear/draw/blit time to enable/disable the appropriate queries in
 * the batch (and transfer active querying between batches in the case of
 * batch reordering).
 */
void
fd_acc_query_update_batch(struct fd_batch *batch, bool disable_all)
{
   struct fd_context *ctx = batch->ctx;

   if (disable_all || ctx->update_active_queries) {
      struct fd_acc_query *query;

      LIST_FOR_EACH_ENTRY (query, &ctx->acc_active_queries, node) {
         /* all three are sampled before the query is touched below: */
         bool moved = query->batch != batch;
         bool running = query->batch != NULL;
         bool wanted =
            !disable_all && (ctx->active_queries || query->provider->always);

         /* stop sampling in the batch the query was attached to: */
         if (running && (moved || !wanted))
            fd_acc_query_pause(query);

         /* (re)start sampling in this batch: */
         if (wanted && (moved || !running))
            fd_acc_query_resume(query, batch);
      }
   }

   ctx->update_active_queries = false;
}

/* Install 'provider' in the context's provider table, in the slot that
 * pidx() selects for the provider's query type.  The slot index being in
 * range, and the slot being empty, are checked by assert() only.
 */
void
fd_acc_query_register_provider(struct pipe_context *pctx,
                               const struct fd_acc_sample_provider *provider)
{
   struct fd_context *ctx = fd_context(pctx);
   int idx = pidx(provider->query_type);

   assert((0 <= idx) && (idx < MAX_HW_SAMPLE_PROVIDERS));
   assert(!ctx->acc_sample_providers[idx]);

   ctx->acc_sample_providers[idx] = provider;
}