| /* -*- mode: C; c-file-style: "k&r"; tab-width 4; indent-tabs-mode: t; -*- */ |
| |
| /* |
| * Copyright (C) 2014 Rob Clark <robclark@freedesktop.org> |
| * |
| * Permission is hereby granted, free of charge, to any person obtaining a |
| * copy of this software and associated documentation files (the "Software"), |
| * to deal in the Software without restriction, including without limitation |
| * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| * and/or sell copies of the Software, and to permit persons to whom the |
| * Software is furnished to do so, subject to the following conditions: |
| * |
| * The above copyright notice and this permission notice (including the next |
| * paragraph) shall be included in all copies or substantial portions of the |
| * Software. |
| * |
| * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
| * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
| * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
| * SOFTWARE. |
| * |
| * Authors: |
| * Rob Clark <robclark@freedesktop.org> |
| */ |
| |
| #include "freedreno_query_hw.h" |
| #include "freedreno_context.h" |
| #include "freedreno_util.h" |
| |
| #include "fd3_query.h" |
| #include "fd3_format.h" |
| |
| |
/* Number of 64-bit counter slots held by one fd_rb_samp_ctrs snapshot. */
enum { FD3_RB_SAMP_CTR_COUNT = 16 };

/*
 * One snapshot of the sample counters used by the occlusion queries in
 * this file.  A buffer of sizeof(struct fd_rb_samp_ctrs) bytes is requested
 * from fd_hw_sample_init() for every sample that is taken.
 *
 * NOTE(review): presumably filled in by the hardware through
 * RB_SAMPLE_COUNT_ADDR -- the meaning of the individual slots is not
 * established by this file.
 */
struct fd_rb_samp_ctrs {
	uint64_t ctr[FD3_RB_SAMP_CTR_COUNT];
};
| |
| /* |
| * Occlusion Query: |
| * |
| * OCCLUSION_COUNTER and OCCLUSION_PREDICATE differ only in how they |
| * interpret results |
| */ |
| |
| static struct fd_hw_sample * |
| occlusion_get_sample(struct fd_batch *batch, struct fd_ringbuffer *ring) |
| { |
| struct fd_hw_sample *samp = |
| fd_hw_sample_init(batch, sizeof(struct fd_rb_samp_ctrs)); |
| |
| /* Set RB_SAMPLE_COUNT_ADDR to samp->offset plus value of |
| * HW_QUERY_BASE_REG register: |
| */ |
| OUT_PKT3(ring, CP_SET_CONSTANT, 3); |
| OUT_RING(ring, CP_REG(REG_A3XX_RB_SAMPLE_COUNT_ADDR) | 0x80000000); |
| OUT_RING(ring, HW_QUERY_BASE_REG); |
| OUT_RING(ring, samp->offset); |
| |
| OUT_PKT0(ring, REG_A3XX_RB_SAMPLE_COUNT_CONTROL, 1); |
| OUT_RING(ring, A3XX_RB_SAMPLE_COUNT_CONTROL_COPY); |
| |
| OUT_PKT3(ring, CP_DRAW_INDX, 3); |
| OUT_RING(ring, 0x00000000); |
| OUT_RING(ring, DRAW(DI_PT_POINTLIST_PSIZE, DI_SRC_SEL_AUTO_INDEX, |
| INDEX_SIZE_IGN, USE_VISIBILITY, 0)); |
| OUT_RING(ring, 0); /* NumIndices */ |
| |
| fd_event_write(batch, ring, ZPASS_DONE); |
| |
| OUT_PKT0(ring, REG_A3XX_RBBM_PERFCTR_CTL, 1); |
| OUT_RING(ring, A3XX_RBBM_PERFCTR_CTL_ENABLE); |
| |
| OUT_PKT0(ring, REG_A3XX_VBIF_PERF_CNT_EN, 1); |
| OUT_RING(ring, A3XX_VBIF_PERF_CNT_EN_CNT0 | |
| A3XX_VBIF_PERF_CNT_EN_CNT1 | |
| A3XX_VBIF_PERF_CNT_EN_PWRCNT0 | |
| A3XX_VBIF_PERF_CNT_EN_PWRCNT1 | |
| A3XX_VBIF_PERF_CNT_EN_PWRCNT2); |
| |
| return samp; |
| } |
| |
| static uint64_t |
| count_samples(const struct fd_rb_samp_ctrs *start, |
| const struct fd_rb_samp_ctrs *end) |
| { |
| uint64_t n = 0; |
| unsigned i; |
| |
| /* not quite sure what all of these are, possibly different |
| * counters for each MRT render target: |
| */ |
| for (i = 0; i < 16; i += 4) |
| n += end->ctr[i] - start->ctr[i]; |
| |
| return n; |
| } |
| |
| static void |
| occlusion_counter_accumulate_result(struct fd_context *ctx, |
| const void *start, const void *end, |
| union pipe_query_result *result) |
| { |
| uint64_t n = count_samples(start, end); |
| result->u64 += n; |
| } |
| |
| static void |
| occlusion_predicate_accumulate_result(struct fd_context *ctx, |
| const void *start, const void *end, |
| union pipe_query_result *result) |
| { |
| uint64_t n = count_samples(start, end); |
| result->b |= (n > 0); |
| } |
| |
| static const struct fd_hw_sample_provider occlusion_counter = { |
| .query_type = PIPE_QUERY_OCCLUSION_COUNTER, |
| .active = FD_STAGE_DRAW, |
| .get_sample = occlusion_get_sample, |
| .accumulate_result = occlusion_counter_accumulate_result, |
| }; |
| |
| static const struct fd_hw_sample_provider occlusion_predicate = { |
| .query_type = PIPE_QUERY_OCCLUSION_PREDICATE, |
| .active = FD_STAGE_DRAW, |
| .get_sample = occlusion_get_sample, |
| .accumulate_result = occlusion_predicate_accumulate_result, |
| }; |
| |
| static const struct fd_hw_sample_provider occlusion_predicate_conservative = { |
| .query_type = PIPE_QUERY_OCCLUSION_PREDICATE_CONSERVATIVE, |
| .active = FD_STAGE_DRAW, |
| .get_sample = occlusion_get_sample, |
| .accumulate_result = occlusion_predicate_accumulate_result, |
| }; |
| |
| void fd3_query_context_init(struct pipe_context *pctx) |
| { |
| struct fd_context *ctx = fd_context(pctx); |
| |
| ctx->create_query = fd_hw_create_query; |
| ctx->query_prepare = fd_hw_query_prepare; |
| ctx->query_prepare_tile = fd_hw_query_prepare_tile; |
| ctx->query_set_stage = fd_hw_query_set_stage; |
| |
| fd_hw_query_register_provider(pctx, &occlusion_counter); |
| fd_hw_query_register_provider(pctx, &occlusion_predicate); |
| fd_hw_query_register_provider(pctx, &occlusion_predicate_conservative); |
| } |