summaryrefslogtreecommitdiff
path: root/src/gallium
diff options
context:
space:
mode:
authorRob Clark <robdclark@chromium.org>2021-06-20 08:58:42 -0700
committerMarge Bot <eric+marge@anholt.net>2021-06-21 18:45:23 +0000
commit5b4f670c1cf0361a7913d256e12544acf7536665 (patch)
tree750af22cdde390154462c9b2ec94c59324fd61fe /src/gallium
parent1a1eabd7d8bb740a0d349bc29b35e7691ca3d0d1 (diff)
freedreno/a6xx: Handle fb_read in sysmem path
Signed-off-by: Rob Clark <robdclark@chromium.org> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/11487>
Diffstat (limited to 'src/gallium')
-rw-r--r--src/gallium/drivers/freedreno/a6xx/fd6_emit.c20
-rw-r--r--src/gallium/drivers/freedreno/a6xx/fd6_gmem.c87
2 files changed, 85 insertions, 22 deletions
diff --git a/src/gallium/drivers/freedreno/a6xx/fd6_emit.c b/src/gallium/drivers/freedreno/a6xx/fd6_emit.c
index 88aef02c77d..1ca7af5d7fc 100644
--- a/src/gallium/drivers/freedreno/a6xx/fd6_emit.c
+++ b/src/gallium/drivers/freedreno/a6xx/fd6_emit.c
@@ -249,25 +249,13 @@ fd6_emit_fb_tex(struct fd_ringbuffer *state, struct fd_context *ctx) assert_dt
struct pipe_surface *psurf = pfb->cbufs[0];
struct fd_resource *rsc = fd_resource(psurf->texture);
- uint32_t texconst0 = fd6_tex_const_0(
- psurf->texture, psurf->u.tex.level, psurf->format, PIPE_SWIZZLE_X,
- PIPE_SWIZZLE_Y, PIPE_SWIZZLE_Z, PIPE_SWIZZLE_W);
-
- /* always TILE6_2 mode in GMEM.. which also means no swap: */
- texconst0 &=
- ~(A6XX_TEX_CONST_0_SWAP__MASK | A6XX_TEX_CONST_0_TILE_MODE__MASK);
- texconst0 |= A6XX_TEX_CONST_0_TILE_MODE(TILE6_2);
-
- OUT_RING(state, texconst0);
+ OUT_RINGP(state, 0, &ctx->batch->fb_read_patches); /* texconst0, patched in gmem emit */
OUT_RING(state, A6XX_TEX_CONST_1_WIDTH(pfb->width) |
A6XX_TEX_CONST_1_HEIGHT(pfb->height));
- OUT_RINGP(state, A6XX_TEX_CONST_2_TYPE(A6XX_TEX_2D),
- &ctx->batch->fb_read_patches);
+ OUT_RING(state, 0); /* texconst2, patched in gmem emit */
OUT_RING(state, A6XX_TEX_CONST_3_ARRAY_PITCH(rsc->layout.layer_size));
-
- OUT_RING(state, A6XX_TEX_CONST_4_BASE_LO(ctx->screen->gmem_base));
- OUT_RING(state, A6XX_TEX_CONST_5_BASE_HI(ctx->screen->gmem_base >> 32) |
- A6XX_TEX_CONST_5_DEPTH(1));
+ OUT_RING(state, 0); /* BASE_LO, patched in gmem emit */
+ OUT_RING(state, 0); /* BASE_HI, patched in gmem emit */
OUT_RING(state, 0); /* texconst6 */
OUT_RING(state, 0); /* texconst7 */
OUT_RING(state, 0); /* texconst8 */
diff --git a/src/gallium/drivers/freedreno/a6xx/fd6_gmem.c b/src/gallium/drivers/freedreno/a6xx/fd6_gmem.c
index 250b5ed7d8e..e5ee771b7c8 100644
--- a/src/gallium/drivers/freedreno/a6xx/fd6_gmem.c
+++ b/src/gallium/drivers/freedreno/a6xx/fd6_gmem.c
@@ -243,15 +243,89 @@ use_hw_binning(struct fd_batch *batch)
}
static void
-patch_fb_read(struct fd_batch *batch)
+patch_fb_read_gmem(struct fd_batch *batch)
{
+ unsigned num_patches = fd_patch_num_elements(&batch->fb_read_patches);
+ if (!num_patches)
+ return;
+
+ struct fd_screen *screen = batch->ctx->screen;
const struct fd_gmem_stateobj *gmem = batch->gmem_state;
+ struct pipe_framebuffer_state *pfb = &batch->framebuffer;
+ struct pipe_surface *psurf = pfb->cbufs[0];
+ uint32_t texconst0 = fd6_tex_const_0(
+ psurf->texture, psurf->u.tex.level, psurf->format, PIPE_SWIZZLE_X,
+ PIPE_SWIZZLE_Y, PIPE_SWIZZLE_Z, PIPE_SWIZZLE_W);
+
+ /* always TILE6_2 mode in GMEM.. which also means no swap: */
+ texconst0 &=
+ ~(A6XX_TEX_CONST_0_SWAP__MASK | A6XX_TEX_CONST_0_TILE_MODE__MASK);
+ texconst0 |= A6XX_TEX_CONST_0_TILE_MODE(TILE6_2);
+
+ for (unsigned i = 0; i < num_patches; i++) {
+ struct fd_cs_patch *patch = fd_patch_element(&batch->fb_read_patches, i);
+ patch->cs[0] = texconst0;
+ patch->cs[2] = A6XX_TEX_CONST_2_PITCH(gmem->bin_w * gmem->cbuf_cpp[0]) |
+ A6XX_TEX_CONST_2_TYPE(A6XX_TEX_2D);
+ patch->cs[4] = A6XX_TEX_CONST_4_BASE_LO(screen->gmem_base);
+ patch->cs[5] = A6XX_TEX_CONST_5_BASE_HI(screen->gmem_base >> 32) |
+ A6XX_TEX_CONST_5_DEPTH(1);
+ }
+ util_dynarray_clear(&batch->fb_read_patches);
+}
+
+static void
+patch_fb_read_sysmem(struct fd_batch *batch)
+{
+ unsigned num_patches = fd_patch_num_elements(&batch->fb_read_patches);
+ if (!num_patches)
+ return;
+
+ struct pipe_framebuffer_state *pfb = &batch->framebuffer;
+ struct pipe_surface *psurf = pfb->cbufs[0];
+ if (!psurf)
+ return;
- for (unsigned i = 0; i < fd_patch_num_elements(&batch->fb_read_patches);
- i++) {
+ struct fd_resource *rsc = fd_resource(psurf->texture);
+ unsigned lvl = psurf->u.tex.level;
+ unsigned layer = psurf->u.tex.first_layer;
+ bool ubwc_enabled = fd_resource_ubwc_enabled(rsc, lvl);
+ uint64_t iova = fd_bo_get_iova(rsc->bo) + fd_resource_offset(rsc, lvl, layer);
+ uint64_t ubwc_iova = fd_bo_get_iova(rsc->bo) + fd_resource_ubwc_offset(rsc, lvl, layer);
+ uint32_t texconst0 = fd6_tex_const_0(
+ psurf->texture, psurf->u.tex.level, psurf->format, PIPE_SWIZZLE_X,
+ PIPE_SWIZZLE_Y, PIPE_SWIZZLE_Z, PIPE_SWIZZLE_W);
+ uint32_t block_width, block_height;
+ fdl6_get_ubwc_blockwidth(&rsc->layout, &block_width, &block_height);
+
+ for (unsigned i = 0; i < num_patches; i++) {
struct fd_cs_patch *patch = fd_patch_element(&batch->fb_read_patches, i);
- *patch->cs =
- patch->val | A6XX_TEX_CONST_2_PITCH(gmem->bin_w * gmem->cbuf_cpp[0]);
+ patch->cs[0] = texconst0;
+ patch->cs[2] = A6XX_TEX_CONST_2_PITCH(fd_resource_pitch(rsc, lvl)) |
+ A6XX_TEX_CONST_2_TYPE(A6XX_TEX_2D);
+ /* This is cheating a bit, since we can't use OUT_RELOC() here.. but
+ * the render target will already have a reloc emitted for RB_MRT state,
+ * so we can get away with manually patching in the address here:
+ */
+ patch->cs[4] = A6XX_TEX_CONST_4_BASE_LO(iova);
+ patch->cs[5] = A6XX_TEX_CONST_5_BASE_HI(iova >> 32) |
+ A6XX_TEX_CONST_5_DEPTH(1);
+
+ if (!ubwc_enabled)
+ continue;
+
+ patch->cs[3] |= A6XX_TEX_CONST_3_FLAG;
+ patch->cs[7] = A6XX_TEX_CONST_7_FLAG_LO(ubwc_iova);
+ patch->cs[8] = A6XX_TEX_CONST_8_FLAG_HI(ubwc_iova >> 32);
+ patch->cs[9] = A6XX_TEX_CONST_9_FLAG_BUFFER_ARRAY_PITCH(
+ rsc->layout.ubwc_layer_size >> 2);
+ patch->cs[10] =
+ A6XX_TEX_CONST_10_FLAG_BUFFER_PITCH(
+ fdl_ubwc_pitch(&rsc->layout, lvl)) |
+ A6XX_TEX_CONST_10_FLAG_BUFFER_LOGW(util_logbase2_ceil(
+ DIV_ROUND_UP(u_minify(psurf->texture->width0, lvl), block_width))) |
+ A6XX_TEX_CONST_10_FLAG_BUFFER_LOGH(util_logbase2_ceil(
+ DIV_ROUND_UP(u_minify(psurf->texture->height0, lvl), block_height)));
}
util_dynarray_clear(&batch->fb_read_patches);
}
@@ -741,7 +815,7 @@ fd6_emit_tile_init(struct fd_batch *batch) assert_dt
emit_zs(ring, pfb->zsbuf, batch->gmem_state);
emit_mrt(ring, pfb, batch->gmem_state);
emit_msaa(ring, pfb->samples);
- patch_fb_read(batch);
+ patch_fb_read_gmem(batch);
if (use_hw_binning(batch)) {
/* enable stream-out during binning pass: */
@@ -1523,6 +1597,7 @@ fd6_emit_sysmem_prep(struct fd_batch *batch) assert_dt
emit_zs(ring, pfb->zsbuf, NULL);
emit_mrt(ring, pfb, NULL);
emit_msaa(ring, pfb->samples);
+ patch_fb_read_sysmem(batch);
update_render_cntl(batch, pfb, false);