summaryrefslogtreecommitdiff
path: root/src/mesa/drivers/dri/i965/brw_wm_surface_state.c
diff options
context:
space:
mode:
Diffstat (limited to 'src/mesa/drivers/dri/i965/brw_wm_surface_state.c')
-rw-r--r--src/mesa/drivers/dri/i965/brw_wm_surface_state.c1705
1 files changed, 0 insertions, 1705 deletions
diff --git a/src/mesa/drivers/dri/i965/brw_wm_surface_state.c b/src/mesa/drivers/dri/i965/brw_wm_surface_state.c
deleted file mode 100644
index 5caeda5239a..00000000000
--- a/src/mesa/drivers/dri/i965/brw_wm_surface_state.c
+++ /dev/null
@@ -1,1705 +0,0 @@
-/*
- Copyright (C) Intel Corp. 2006. All Rights Reserved.
- Intel funded Tungsten Graphics to
- develop this 3D driver.
-
- Permission is hereby granted, free of charge, to any person obtaining
- a copy of this software and associated documentation files (the
- "Software"), to deal in the Software without restriction, including
- without limitation the rights to use, copy, modify, merge, publish,
- distribute, sublicense, and/or sell copies of the Software, and to
- permit persons to whom the Software is furnished to do so, subject to
- the following conditions:
-
- The above copyright notice and this permission notice (including the
- next paragraph) shall be included in all copies or substantial
- portions of the Software.
-
- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
- IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
- LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
- OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
- WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
-
- **********************************************************************/
- /*
- * Authors:
- * Keith Whitwell <keithw@vmware.com>
- */
-
-
-#include "compiler/nir/nir.h"
-#include "main/context.h"
-#include "main/blend.h"
-#include "main/mtypes.h"
-#include "main/samplerobj.h"
-#include "main/shaderimage.h"
-#include "main/teximage.h"
-#include "program/prog_parameter.h"
-#include "program/prog_instruction.h"
-#include "main/framebuffer.h"
-#include "main/shaderapi.h"
-
-#include "isl/isl.h"
-
-#include "brw_mipmap_tree.h"
-#include "brw_batch.h"
-#include "brw_tex.h"
-#include "brw_fbo.h"
-#include "brw_buffer_objects.h"
-
-#include "brw_context.h"
-#include "brw_state.h"
-#include "brw_defines.h"
-#include "brw_wm.h"
-
-static const uint32_t wb_mocs[] = {
- [7] = GFX7_MOCS_L3,
- [8] = BDW_MOCS_WB,
- [9] = SKL_MOCS_WB,
- [10] = CNL_MOCS_WB,
- [11] = ICL_MOCS_WB,
-};
-
-static const uint32_t pte_mocs[] = {
- [7] = GFX7_MOCS_L3,
- [8] = BDW_MOCS_PTE,
- [9] = SKL_MOCS_PTE,
- [10] = CNL_MOCS_PTE,
- [11] = ICL_MOCS_PTE,
-};
-
-uint32_t
-brw_get_bo_mocs(const struct intel_device_info *devinfo, struct brw_bo *bo)
-{
- return (bo && bo->external ? pte_mocs : wb_mocs)[devinfo->ver];
-}
-
-static void
-get_isl_surf(struct brw_context *brw, struct brw_mipmap_tree *mt,
- GLenum target, struct isl_view *view,
- uint32_t *tile_x, uint32_t *tile_y,
- uint32_t *offset, struct isl_surf *surf)
-{
- *surf = mt->surf;
-
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- const enum isl_dim_layout dim_layout =
- get_isl_dim_layout(devinfo, mt->surf.tiling, target);
-
- surf->dim = get_isl_surf_dim(target);
-
- if (surf->dim_layout == dim_layout)
- return;
-
- /* The layout of the specified texture target is not compatible with the
- * actual layout of the miptree structure in memory -- You're entering
- * dangerous territory, this can only possibly work if you only intended
- * to access a single level and slice of the texture, and the hardware
- * supports the tile offset feature in order to allow non-tile-aligned
- * base offsets, since we'll have to point the hardware to the first
- * texel of the level instead of relying on the usual base level/layer
- * controls.
- */
- assert(devinfo->has_surface_tile_offset);
- assert(view->levels == 1 && view->array_len == 1);
- assert(*tile_x == 0 && *tile_y == 0);
-
- *offset += brw_miptree_get_tile_offsets(mt, view->base_level,
- view->base_array_layer,
- tile_x, tile_y);
-
- /* Minify the logical dimensions of the texture. */
- const unsigned l = view->base_level - mt->first_level;
- surf->logical_level0_px.width = minify(surf->logical_level0_px.width, l);
- surf->logical_level0_px.height = surf->dim <= ISL_SURF_DIM_1D ? 1 :
- minify(surf->logical_level0_px.height, l);
- surf->logical_level0_px.depth = surf->dim <= ISL_SURF_DIM_2D ? 1 :
- minify(surf->logical_level0_px.depth, l);
-
- /* Only the base level and layer can be addressed with the overridden
- * layout.
- */
- surf->logical_level0_px.array_len = 1;
- surf->levels = 1;
- surf->dim_layout = dim_layout;
-
- /* The requested slice of the texture is now at the base level and
- * layer.
- */
- view->base_level = 0;
- view->base_array_layer = 0;
-}
-
-static void
-brw_emit_surface_state(struct brw_context *brw,
- struct brw_mipmap_tree *mt,
- GLenum target, struct isl_view view,
- enum isl_aux_usage aux_usage,
- uint32_t *surf_offset, int surf_index,
- unsigned reloc_flags)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- uint32_t tile_x = mt->level[0].level_x;
- uint32_t tile_y = mt->level[0].level_y;
- uint32_t offset = mt->offset;
-
- struct isl_surf surf;
-
- get_isl_surf(brw, mt, target, &view, &tile_x, &tile_y, &offset, &surf);
-
- union isl_color_value clear_color = { .u32 = { 0, 0, 0, 0 } };
-
- struct brw_bo *aux_bo = NULL;
- struct isl_surf *aux_surf = NULL;
- uint64_t aux_offset = 0;
- struct brw_bo *clear_bo = NULL;
- uint64_t clear_offset = 0;
-
- if (aux_usage != ISL_AUX_USAGE_NONE) {
- aux_surf = &mt->aux_buf->surf;
- aux_bo = mt->aux_buf->bo;
- aux_offset = mt->aux_buf->offset;
-
- /* We only really need a clear color if we also have an auxiliary
- * surface. Without one, it does nothing.
- */
- clear_color = brw_miptree_get_clear_color(mt, &clear_bo, &clear_offset);
- }
-
- void *state = brw_state_batch(brw,
- brw->isl_dev.ss.size,
- brw->isl_dev.ss.align,
- surf_offset);
-
- isl_surf_fill_state(&brw->isl_dev, state, .surf = &surf, .view = &view,
- .address = brw_state_reloc(&brw->batch,
- *surf_offset + brw->isl_dev.ss.addr_offset,
- mt->bo, offset, reloc_flags),
- .aux_surf = aux_surf, .aux_usage = aux_usage,
- .aux_address = aux_offset,
- .mocs = brw_get_bo_mocs(devinfo, mt->bo),
- .clear_color = clear_color,
- .use_clear_address = clear_bo != NULL,
- .clear_address = clear_offset,
- .x_offset_sa = tile_x, .y_offset_sa = tile_y);
- if (aux_surf) {
- /* On gfx7 and prior, the upper 20 bits of surface state DWORD 6 are the
- * upper 20 bits of the GPU address of the MCS buffer; the lower 12 bits
- * contain other control information. Since buffer addresses are always
- * on 4k boundaries (and thus have their lower 12 bits zero), we can use
- * an ordinary reloc to do the necessary address translation.
- *
- * FIXME: move to the point of assignment.
- */
- assert((aux_offset & 0xfff) == 0);
-
- if (devinfo->ver >= 8) {
- uint64_t *aux_addr = state + brw->isl_dev.ss.aux_addr_offset;
- *aux_addr = brw_state_reloc(&brw->batch,
- *surf_offset +
- brw->isl_dev.ss.aux_addr_offset,
- aux_bo, *aux_addr,
- reloc_flags);
- } else {
- uint32_t *aux_addr = state + brw->isl_dev.ss.aux_addr_offset;
- *aux_addr = brw_state_reloc(&brw->batch,
- *surf_offset +
- brw->isl_dev.ss.aux_addr_offset,
- aux_bo, *aux_addr,
- reloc_flags);
-
- }
- }
-
- if (clear_bo != NULL) {
- /* Make sure the offset is aligned with a cacheline. */
- assert((clear_offset & 0x3f) == 0);
- uint64_t *clear_address =
- state + brw->isl_dev.ss.clear_color_state_offset;
- *clear_address = brw_state_reloc(&brw->batch,
- *surf_offset +
- brw->isl_dev.ss.clear_color_state_offset,
- clear_bo, *clear_address, reloc_flags);
- }
-}
-
-static uint32_t
-gfx6_update_renderbuffer_surface(struct brw_context *brw,
- struct gl_renderbuffer *rb,
- unsigned unit,
- uint32_t surf_index)
-{
- struct gl_context *ctx = &brw->ctx;
- struct brw_renderbuffer *irb = brw_renderbuffer(rb);
- struct brw_mipmap_tree *mt = irb->mt;
-
- assert(brw_render_target_supported(brw, rb));
-
- mesa_format rb_format = _mesa_get_render_format(ctx, brw_rb_format(irb));
- if (unlikely(!brw->mesa_format_supports_render[rb_format])) {
- _mesa_problem(ctx, "%s: renderbuffer format %s unsupported\n",
- __func__, _mesa_get_format_name(rb_format));
- }
- enum isl_format isl_format = brw->mesa_to_isl_render_format[rb_format];
-
- struct isl_view view = {
- .format = isl_format,
- .base_level = irb->mt_level - irb->mt->first_level,
- .levels = 1,
- .base_array_layer = irb->mt_layer,
- .array_len = MAX2(irb->layer_count, 1),
- .swizzle = ISL_SWIZZLE_IDENTITY,
- .usage = ISL_SURF_USAGE_RENDER_TARGET_BIT,
- };
-
- uint32_t offset;
- brw_emit_surface_state(brw, mt, mt->target, view,
- brw->draw_aux_usage[unit],
- &offset, surf_index,
- RELOC_WRITE);
- return offset;
-}
-
-GLuint
-translate_tex_target(GLenum target)
-{
- switch (target) {
- case GL_TEXTURE_1D:
- case GL_TEXTURE_1D_ARRAY_EXT:
- return BRW_SURFACE_1D;
-
- case GL_TEXTURE_RECTANGLE_NV:
- return BRW_SURFACE_2D;
-
- case GL_TEXTURE_2D:
- case GL_TEXTURE_2D_ARRAY_EXT:
- case GL_TEXTURE_EXTERNAL_OES:
- case GL_TEXTURE_2D_MULTISAMPLE:
- case GL_TEXTURE_2D_MULTISAMPLE_ARRAY:
- return BRW_SURFACE_2D;
-
- case GL_TEXTURE_3D:
- return BRW_SURFACE_3D;
-
- case GL_TEXTURE_CUBE_MAP:
- case GL_TEXTURE_CUBE_MAP_ARRAY:
- return BRW_SURFACE_CUBE;
-
- default:
- unreachable("not reached");
- }
-}
-
-uint32_t
-brw_get_surface_tiling_bits(enum isl_tiling tiling)
-{
- switch (tiling) {
- case ISL_TILING_X:
- return BRW_SURFACE_TILED;
- case ISL_TILING_Y0:
- return BRW_SURFACE_TILED | BRW_SURFACE_TILED_Y;
- default:
- return 0;
- }
-}
-
-
-uint32_t
-brw_get_surface_num_multisamples(unsigned num_samples)
-{
- if (num_samples > 1)
- return BRW_SURFACE_MULTISAMPLECOUNT_4;
- else
- return BRW_SURFACE_MULTISAMPLECOUNT_1;
-}
-
-/**
- * Compute the combination of DEPTH_TEXTURE_MODE and EXT_texture_swizzle
- * swizzling.
- */
-int
-brw_get_texture_swizzle(const struct gl_context *ctx,
- const struct gl_texture_object *t)
-{
- const struct gl_texture_image *img = t->Image[0][t->Attrib.BaseLevel];
-
- int swizzles[SWIZZLE_NIL + 1] = {
- SWIZZLE_X,
- SWIZZLE_Y,
- SWIZZLE_Z,
- SWIZZLE_W,
- SWIZZLE_ZERO,
- SWIZZLE_ONE,
- SWIZZLE_NIL
- };
-
- if (img->_BaseFormat == GL_DEPTH_COMPONENT ||
- img->_BaseFormat == GL_DEPTH_STENCIL) {
- GLenum depth_mode = t->Attrib.DepthMode;
-
- /* In ES 3.0, DEPTH_TEXTURE_MODE is expected to be GL_RED for textures
- * with depth component data specified with a sized internal format.
- * Otherwise, it's left at the old default, GL_LUMINANCE.
- */
- if (_mesa_is_gles3(ctx) &&
- img->InternalFormat != GL_DEPTH_COMPONENT &&
- img->InternalFormat != GL_DEPTH_STENCIL) {
- depth_mode = GL_RED;
- }
-
- switch (depth_mode) {
- case GL_ALPHA:
- swizzles[0] = SWIZZLE_ZERO;
- swizzles[1] = SWIZZLE_ZERO;
- swizzles[2] = SWIZZLE_ZERO;
- swizzles[3] = SWIZZLE_X;
- break;
- case GL_LUMINANCE:
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_X;
- swizzles[2] = SWIZZLE_X;
- swizzles[3] = SWIZZLE_ONE;
- break;
- case GL_INTENSITY:
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_X;
- swizzles[2] = SWIZZLE_X;
- swizzles[3] = SWIZZLE_X;
- break;
- case GL_RED:
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_ZERO;
- swizzles[2] = SWIZZLE_ZERO;
- swizzles[3] = SWIZZLE_ONE;
- break;
- }
- }
-
- GLenum datatype = _mesa_get_format_datatype(img->TexFormat);
-
- /* If the texture's format is alpha-only, force R, G, and B to
- * 0.0. Similarly, if the texture's format has no alpha channel,
- * force the alpha value read to 1.0. This allows for the
- * implementation to use an RGBA texture for any of these formats
- * without leaking any unexpected values.
- */
- switch (img->_BaseFormat) {
- case GL_ALPHA:
- swizzles[0] = SWIZZLE_ZERO;
- swizzles[1] = SWIZZLE_ZERO;
- swizzles[2] = SWIZZLE_ZERO;
- break;
- case GL_LUMINANCE:
- if (t->_IsIntegerFormat || datatype == GL_SIGNED_NORMALIZED) {
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_X;
- swizzles[2] = SWIZZLE_X;
- swizzles[3] = SWIZZLE_ONE;
- }
- break;
- case GL_LUMINANCE_ALPHA:
- if (datatype == GL_SIGNED_NORMALIZED) {
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_X;
- swizzles[2] = SWIZZLE_X;
- swizzles[3] = SWIZZLE_W;
- }
- break;
- case GL_INTENSITY:
- if (datatype == GL_SIGNED_NORMALIZED) {
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_X;
- swizzles[2] = SWIZZLE_X;
- swizzles[3] = SWIZZLE_X;
- }
- break;
- case GL_RED:
- if (img->TexFormat == MESA_FORMAT_R_SRGB8) {
- swizzles[0] = SWIZZLE_X;
- swizzles[1] = SWIZZLE_ZERO;
- swizzles[2] = SWIZZLE_ZERO;
- swizzles[3] = SWIZZLE_ONE;
- break;
- }
- FALLTHROUGH;
- case GL_RG:
- case GL_RGB:
- if (_mesa_get_format_bits(img->TexFormat, GL_ALPHA_BITS) > 0 ||
- img->TexFormat == MESA_FORMAT_RGB_DXT1 ||
- img->TexFormat == MESA_FORMAT_SRGB_DXT1)
- swizzles[3] = SWIZZLE_ONE;
- break;
- }
-
- return MAKE_SWIZZLE4(swizzles[GET_SWZ(t->Attrib._Swizzle, 0)],
- swizzles[GET_SWZ(t->Attrib._Swizzle, 1)],
- swizzles[GET_SWZ(t->Attrib._Swizzle, 2)],
- swizzles[GET_SWZ(t->Attrib._Swizzle, 3)]);
-}
-
-/**
- * Convert an swizzle enumeration (i.e. SWIZZLE_X) to one of the Gfx7.5+
- * "Shader Channel Select" enumerations (i.e. HSW_SCS_RED). The mappings are
- *
- * SWIZZLE_X, SWIZZLE_Y, SWIZZLE_Z, SWIZZLE_W, SWIZZLE_ZERO, SWIZZLE_ONE
- * 0 1 2 3 4 5
- * 4 5 6 7 0 1
- * SCS_RED, SCS_GREEN, SCS_BLUE, SCS_ALPHA, SCS_ZERO, SCS_ONE
- *
- * which is simply adding 4 then modding by 8 (or anding with 7).
- *
- * We then may need to apply workarounds for textureGather hardware bugs.
- */
-static unsigned
-swizzle_to_scs(GLenum swizzle, bool need_green_to_blue)
-{
- unsigned scs = (swizzle + 4) & 7;
-
- return (need_green_to_blue && scs == HSW_SCS_GREEN) ? HSW_SCS_BLUE : scs;
-}
-
-static void brw_update_texture_surface(struct gl_context *ctx,
- unsigned unit,
- uint32_t *surf_offset,
- bool for_gather,
- bool for_txf,
- uint32_t plane)
-{
- struct brw_context *brw = brw_context(ctx);
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- struct gl_texture_object *obj = ctx->Texture.Unit[unit]._Current;
-
- if (obj->Target == GL_TEXTURE_BUFFER) {
- brw_update_buffer_texture_surface(ctx, unit, surf_offset);
-
- } else {
- struct brw_texture_object *intel_obj = brw_texture_object(obj);
- struct brw_mipmap_tree *mt = intel_obj->mt;
-
- if (plane > 0) {
- if (mt->plane[plane - 1] == NULL)
- return;
- mt = mt->plane[plane - 1];
- }
-
- struct gl_sampler_object *sampler = _mesa_get_samplerobj(ctx, unit);
- /* If this is a view with restricted NumLayers, then our effective depth
- * is not just the miptree depth.
- */
- unsigned view_num_layers;
- if (obj->Immutable && obj->Target != GL_TEXTURE_3D) {
- view_num_layers = obj->Attrib.NumLayers;
- } else {
- view_num_layers = mt->surf.dim == ISL_SURF_DIM_3D ?
- mt->surf.logical_level0_px.depth :
- mt->surf.logical_level0_px.array_len;
- }
-
- /* Handling GL_ALPHA as a surface format override breaks 1.30+ style
- * texturing functions that return a float, as our code generation always
- * selects the .x channel (which would always be 0).
- */
- struct gl_texture_image *firstImage = obj->Image[0][obj->Attrib.BaseLevel];
- const bool alpha_depth = obj->Attrib.DepthMode == GL_ALPHA &&
- (firstImage->_BaseFormat == GL_DEPTH_COMPONENT ||
- firstImage->_BaseFormat == GL_DEPTH_STENCIL);
- const unsigned swizzle = (unlikely(alpha_depth) ? SWIZZLE_XYZW :
- brw_get_texture_swizzle(&brw->ctx, obj));
-
- mesa_format mesa_fmt;
- if (firstImage->_BaseFormat == GL_DEPTH_STENCIL ||
- firstImage->_BaseFormat == GL_DEPTH_COMPONENT) {
- /* The format from intel_obj may be a combined depth stencil format
- * when we just want depth. Pull it from the miptree instead. This
- * is safe because texture views aren't allowed on depth/stencil.
- */
- mesa_fmt = mt->format;
- } else if (brw_miptree_has_etc_shadow(brw, mt)) {
- mesa_fmt = mt->shadow_mt->format;
- } else if (plane > 0) {
- mesa_fmt = mt->format;
- } else {
- mesa_fmt = intel_obj->_Format;
- }
- enum isl_format format = translate_tex_format(brw, mesa_fmt,
- for_txf ? GL_DECODE_EXT :
- sampler->Attrib.sRGBDecode);
-
- /* Implement gfx6 and gfx7 gather work-around */
- bool need_green_to_blue = false;
- if (for_gather) {
- if (devinfo->ver == 7 && (format == ISL_FORMAT_R32G32_FLOAT ||
- format == ISL_FORMAT_R32G32_SINT ||
- format == ISL_FORMAT_R32G32_UINT)) {
- format = ISL_FORMAT_R32G32_FLOAT_LD;
- need_green_to_blue = devinfo->is_haswell;
- } else if (devinfo->ver == 6) {
- /* Sandybridge's gather4 message is broken for integer formats.
- * To work around this, we pretend the surface is UNORM for
- * 8 or 16-bit formats, and emit shader instructions to recover
- * the real INT/UINT value. For 32-bit formats, we pretend
- * the surface is FLOAT, and simply reinterpret the resulting
- * bits.
- */
- switch (format) {
- case ISL_FORMAT_R8_SINT:
- case ISL_FORMAT_R8_UINT:
- format = ISL_FORMAT_R8_UNORM;
- break;
-
- case ISL_FORMAT_R16_SINT:
- case ISL_FORMAT_R16_UINT:
- format = ISL_FORMAT_R16_UNORM;
- break;
-
- case ISL_FORMAT_R32_SINT:
- case ISL_FORMAT_R32_UINT:
- format = ISL_FORMAT_R32_FLOAT;
- break;
-
- default:
- break;
- }
- }
- }
-
- if (obj->StencilSampling && firstImage->_BaseFormat == GL_DEPTH_STENCIL) {
- if (devinfo->ver <= 7) {
- assert(mt->shadow_mt && !mt->stencil_mt->shadow_needs_update);
- mt = mt->shadow_mt;
- } else {
- mt = mt->stencil_mt;
- }
- format = ISL_FORMAT_R8_UINT;
- } else if (devinfo->ver <= 7 && mt->format == MESA_FORMAT_S_UINT8) {
- assert(mt->shadow_mt && !mt->shadow_needs_update);
- mt = mt->shadow_mt;
- format = ISL_FORMAT_R8_UINT;
- } else if (brw_miptree_needs_fake_etc(brw, mt)) {
- assert(mt->shadow_mt && !mt->shadow_needs_update);
- mt = mt->shadow_mt;
- }
-
- const int surf_index = surf_offset - &brw->wm.base.surf_offset[0];
-
- struct isl_view view = {
- .format = format,
- .base_level = obj->Attrib.MinLevel + obj->Attrib.BaseLevel,
- .levels = intel_obj->_MaxLevel - obj->Attrib.BaseLevel + 1,
- .base_array_layer = obj->Attrib.MinLayer,
- .array_len = view_num_layers,
- .swizzle = {
- .r = swizzle_to_scs(GET_SWZ(swizzle, 0), need_green_to_blue),
- .g = swizzle_to_scs(GET_SWZ(swizzle, 1), need_green_to_blue),
- .b = swizzle_to_scs(GET_SWZ(swizzle, 2), need_green_to_blue),
- .a = swizzle_to_scs(GET_SWZ(swizzle, 3), need_green_to_blue),
- },
- .usage = ISL_SURF_USAGE_TEXTURE_BIT,
- };
-
- /* On Ivy Bridge and earlier, we handle texture swizzle with shader
- * code. The actual surface swizzle should be identity.
- */
- if (devinfo->verx10 <= 70)
- view.swizzle = ISL_SWIZZLE_IDENTITY;
-
- if (obj->Target == GL_TEXTURE_CUBE_MAP ||
- obj->Target == GL_TEXTURE_CUBE_MAP_ARRAY)
- view.usage |= ISL_SURF_USAGE_CUBE_BIT;
-
- enum isl_aux_usage aux_usage =
- brw_miptree_texture_aux_usage(brw, mt, format,
- brw->gfx9_astc5x5_wa_tex_mask);
-
- brw_emit_surface_state(brw, mt, mt->target, view, aux_usage,
- surf_offset, surf_index,
- 0);
- }
-}
-
-void
-brw_emit_buffer_surface_state(struct brw_context *brw,
- uint32_t *out_offset,
- struct brw_bo *bo,
- unsigned buffer_offset,
- enum isl_format format,
- unsigned buffer_size,
- unsigned pitch,
- unsigned reloc_flags)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- uint32_t *dw = brw_state_batch(brw,
- brw->isl_dev.ss.size,
- brw->isl_dev.ss.align,
- out_offset);
-
- isl_buffer_fill_state(&brw->isl_dev, dw,
- .address = !bo ? buffer_offset :
- brw_state_reloc(&brw->batch,
- *out_offset + brw->isl_dev.ss.addr_offset,
- bo, buffer_offset,
- reloc_flags),
- .size_B = buffer_size,
- .format = format,
- .swizzle = ISL_SWIZZLE_IDENTITY,
- .stride_B = pitch,
- .mocs = brw_get_bo_mocs(devinfo, bo));
-}
-
-static unsigned
-buffer_texture_range_size(struct brw_context *brw,
- struct gl_texture_object *obj)
-{
- assert(obj->Target == GL_TEXTURE_BUFFER);
- const unsigned texel_size = _mesa_get_format_bytes(obj->_BufferObjectFormat);
- const unsigned buffer_size = (!obj->BufferObject ? 0 :
- obj->BufferObject->Size);
- const unsigned buffer_offset = MIN2(buffer_size, obj->BufferOffset);
-
- /* The ARB_texture_buffer_specification says:
- *
- * "The number of texels in the buffer texture's texel array is given by
- *
- * floor(<buffer_size> / (<components> * sizeof(<base_type>)),
- *
- * where <buffer_size> is the size of the buffer object, in basic
- * machine units and <components> and <base_type> are the element count
- * and base data type for elements, as specified in Table X.1. The
- * number of texels in the texel array is then clamped to the
- * implementation-dependent limit MAX_TEXTURE_BUFFER_SIZE_ARB."
- *
- * We need to clamp the size in bytes to MAX_TEXTURE_BUFFER_SIZE * stride,
- * so that when ISL divides by stride to obtain the number of texels, that
- * texel count is clamped to MAX_TEXTURE_BUFFER_SIZE.
- */
- return MIN3((unsigned)obj->BufferSize,
- buffer_size - buffer_offset,
- brw->ctx.Const.MaxTextureBufferSize * texel_size);
-}
-
-void
-brw_update_buffer_texture_surface(struct gl_context *ctx,
- unsigned unit,
- uint32_t *surf_offset)
-{
- struct brw_context *brw = brw_context(ctx);
- struct gl_texture_object *tObj = ctx->Texture.Unit[unit]._Current;
- struct brw_buffer_object *intel_obj =
- brw_buffer_object(tObj->BufferObject);
- const unsigned size = buffer_texture_range_size(brw, tObj);
- struct brw_bo *bo = NULL;
- mesa_format format = tObj->_BufferObjectFormat;
- const enum isl_format isl_format = brw_isl_format_for_mesa_format(format);
- int texel_size = _mesa_get_format_bytes(format);
-
- if (intel_obj)
- bo = brw_bufferobj_buffer(brw, intel_obj, tObj->BufferOffset, size,
- false);
-
- if (isl_format == ISL_FORMAT_UNSUPPORTED) {
- _mesa_problem(NULL, "bad format %s for texture buffer\n",
- _mesa_get_format_name(format));
- }
-
- brw_emit_buffer_surface_state(brw, surf_offset, bo,
- tObj->BufferOffset,
- isl_format,
- size,
- texel_size,
- 0);
-}
-
-/**
- * Set up a binding table entry for use by stream output logic (transform
- * feedback).
- *
- * buffer_size_minus_1 must be less than BRW_MAX_NUM_BUFFER_ENTRIES.
- */
-void
-brw_update_sol_surface(struct brw_context *brw,
- struct gl_buffer_object *buffer_obj,
- uint32_t *out_offset, unsigned num_vector_components,
- unsigned stride_dwords, unsigned offset_dwords)
-{
- struct brw_buffer_object *intel_bo = brw_buffer_object(buffer_obj);
- uint32_t offset_bytes = 4 * offset_dwords;
- struct brw_bo *bo = brw_bufferobj_buffer(brw, intel_bo,
- offset_bytes,
- buffer_obj->Size - offset_bytes,
- true);
- uint32_t *surf = brw_state_batch(brw, 6 * 4, 32, out_offset);
- uint32_t pitch_minus_1 = 4*stride_dwords - 1;
- size_t size_dwords = buffer_obj->Size / 4;
- uint32_t buffer_size_minus_1, width, height, depth, surface_format;
-
- /* FIXME: can we rely on core Mesa to ensure that the buffer isn't
- * too big to map using a single binding table entry?
- */
- assert((size_dwords - offset_dwords) / stride_dwords
- <= BRW_MAX_NUM_BUFFER_ENTRIES);
-
- if (size_dwords > offset_dwords + num_vector_components) {
- /* There is room for at least 1 transform feedback output in the buffer.
- * Compute the number of additional transform feedback outputs the
- * buffer has room for.
- */
- buffer_size_minus_1 =
- (size_dwords - offset_dwords - num_vector_components) / stride_dwords;
- } else {
- /* There isn't even room for a single transform feedback output in the
- * buffer. We can't configure the binding table entry to prevent output
- * entirely; we'll have to rely on the geometry shader to detect
- * overflow. But to minimize the damage in case of a bug, set up the
- * binding table entry to just allow a single output.
- */
- buffer_size_minus_1 = 0;
- }
- width = buffer_size_minus_1 & 0x7f;
- height = (buffer_size_minus_1 & 0xfff80) >> 7;
- depth = (buffer_size_minus_1 & 0x7f00000) >> 20;
-
- switch (num_vector_components) {
- case 1:
- surface_format = ISL_FORMAT_R32_FLOAT;
- break;
- case 2:
- surface_format = ISL_FORMAT_R32G32_FLOAT;
- break;
- case 3:
- surface_format = ISL_FORMAT_R32G32B32_FLOAT;
- break;
- case 4:
- surface_format = ISL_FORMAT_R32G32B32A32_FLOAT;
- break;
- default:
- unreachable("Invalid vector size for transform feedback output");
- }
-
- surf[0] = BRW_SURFACE_BUFFER << BRW_SURFACE_TYPE_SHIFT |
- BRW_SURFACE_MIPMAPLAYOUT_BELOW << BRW_SURFACE_MIPLAYOUT_SHIFT |
- surface_format << BRW_SURFACE_FORMAT_SHIFT |
- BRW_SURFACE_RC_READ_WRITE;
- surf[1] = brw_state_reloc(&brw->batch,
- *out_offset + 4, bo, offset_bytes, RELOC_WRITE);
- surf[2] = (width << BRW_SURFACE_WIDTH_SHIFT |
- height << BRW_SURFACE_HEIGHT_SHIFT);
- surf[3] = (depth << BRW_SURFACE_DEPTH_SHIFT |
- pitch_minus_1 << BRW_SURFACE_PITCH_SHIFT);
- surf[4] = 0;
- surf[5] = 0;
-}
-
-/* Creates a new WM constant buffer reflecting the current fragment program's
- * constants, if needed by the fragment program.
- *
- * Otherwise, constants go through the CURBEs using the brw_constant_buffer
- * state atom.
- */
-static void
-brw_upload_wm_pull_constants(struct brw_context *brw)
-{
- struct brw_stage_state *stage_state = &brw->wm.base;
- /* BRW_NEW_FRAGMENT_PROGRAM */
- struct brw_program *fp =
- (struct brw_program *) brw->programs[MESA_SHADER_FRAGMENT];
-
- /* BRW_NEW_FS_PROG_DATA */
- struct brw_stage_prog_data *prog_data = brw->wm.base.prog_data;
-
- _mesa_shader_write_subroutine_indices(&brw->ctx, MESA_SHADER_FRAGMENT);
- /* _NEW_PROGRAM_CONSTANTS */
- brw_upload_pull_constants(brw, BRW_NEW_SURFACES, &fp->program,
- stage_state, prog_data);
-}
-
-const struct brw_tracked_state brw_wm_pull_constants = {
- .dirty = {
- .mesa = _NEW_PROGRAM_CONSTANTS,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_FRAGMENT_PROGRAM |
- BRW_NEW_FS_PROG_DATA,
- },
- .emit = brw_upload_wm_pull_constants,
-};
-
-/**
- * Creates a null renderbuffer surface.
- *
- * This is used when the shader doesn't write to any color output. An FB
- * write to target 0 will still be emitted, because that's how the thread is
- * terminated (and computed depth is returned), so we need to have the
- * hardware discard the target 0 color output..
- */
-static void
-emit_null_surface_state(struct brw_context *brw,
- const struct gl_framebuffer *fb,
- uint32_t *out_offset)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- uint32_t *surf = brw_state_batch(brw,
- brw->isl_dev.ss.size,
- brw->isl_dev.ss.align,
- out_offset);
-
- /* Use the fb dimensions or 1x1x1 */
- const unsigned width = fb ? _mesa_geometric_width(fb) : 1;
- const unsigned height = fb ? _mesa_geometric_height(fb) : 1;
- const unsigned samples = fb ? _mesa_geometric_samples(fb) : 1;
-
- if (devinfo->ver != 6 || samples <= 1) {
- isl_null_fill_state(&brw->isl_dev, surf,
- .size = isl_extent3d(width, height, 1));
- return;
- }
-
- /* On Gfx6, null render targets seem to cause GPU hangs when multisampling.
- * So work around this problem by rendering into dummy color buffer.
- *
- * To decrease the amount of memory needed by the workaround buffer, we
- * set its pitch to 128 bytes (the width of a Y tile). This means that
- * the amount of memory needed for the workaround buffer is
- * (width_in_tiles + height_in_tiles - 1) tiles.
- *
- * Note that since the workaround buffer will be interpreted by the
- * hardware as an interleaved multisampled buffer, we need to compute
- * width_in_tiles and height_in_tiles by dividing the width and height
- * by 16 rather than the normal Y-tile size of 32.
- */
- unsigned width_in_tiles = ALIGN(width, 16) / 16;
- unsigned height_in_tiles = ALIGN(height, 16) / 16;
- unsigned pitch_minus_1 = 127;
- unsigned size_needed = (width_in_tiles + height_in_tiles - 1) * 4096;
- brw_get_scratch_bo(brw, &brw->wm.multisampled_null_render_target_bo,
- size_needed);
-
- surf[0] = (BRW_SURFACE_2D << BRW_SURFACE_TYPE_SHIFT |
- ISL_FORMAT_B8G8R8A8_UNORM << BRW_SURFACE_FORMAT_SHIFT);
- surf[1] = brw_state_reloc(&brw->batch, *out_offset + 4,
- brw->wm.multisampled_null_render_target_bo,
- 0, RELOC_WRITE);
-
- surf[2] = ((width - 1) << BRW_SURFACE_WIDTH_SHIFT |
- (height - 1) << BRW_SURFACE_HEIGHT_SHIFT);
-
- /* From Sandy bridge PRM, Vol4 Part1 p82 (Tiled Surface: Programming
- * Notes):
- *
- * If Surface Type is SURFTYPE_NULL, this field must be TRUE
- */
- surf[3] = (BRW_SURFACE_TILED | BRW_SURFACE_TILED_Y |
- pitch_minus_1 << BRW_SURFACE_PITCH_SHIFT);
- surf[4] = BRW_SURFACE_MULTISAMPLECOUNT_4;
- surf[5] = 0;
-}
-
-/**
- * Sets up a surface state structure to point at the given region.
- * While it is only used for the front/back buffer currently, it should be
- * usable for further buffers when doing ARB_draw_buffer support.
- */
-static uint32_t
-gfx4_update_renderbuffer_surface(struct brw_context *brw,
- struct gl_renderbuffer *rb,
- unsigned unit,
- uint32_t surf_index)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- struct gl_context *ctx = &brw->ctx;
- struct brw_renderbuffer *irb = brw_renderbuffer(rb);
- struct brw_mipmap_tree *mt = irb->mt;
- uint32_t *surf;
- uint32_t tile_x, tile_y;
- enum isl_format format;
- uint32_t offset;
- /* _NEW_BUFFERS */
- mesa_format rb_format = _mesa_get_render_format(ctx, brw_rb_format(irb));
- /* BRW_NEW_FS_PROG_DATA */
-
- if (rb->TexImage && !devinfo->has_surface_tile_offset) {
- brw_renderbuffer_get_tile_offsets(irb, &tile_x, &tile_y);
-
- if (tile_x != 0 || tile_y != 0) {
- /* Original gfx4 hardware couldn't draw to a non-tile-aligned
- * destination in a miptree unless you actually setup your renderbuffer
- * as a miptree and used the fragile lod/array_index/etc. controls to
- * select the image. So, instead, we just make a new single-level
- * miptree and render into that.
- */
- brw_renderbuffer_move_to_temp(brw, irb, false);
- assert(irb->align_wa_mt);
- mt = irb->align_wa_mt;
- }
- }
-
- surf = brw_state_batch(brw, 6 * 4, 32, &offset);
-
- format = brw->mesa_to_isl_render_format[rb_format];
- if (unlikely(!brw->mesa_format_supports_render[rb_format])) {
- _mesa_problem(ctx, "%s: renderbuffer format %s unsupported\n",
- __func__, _mesa_get_format_name(rb_format));
- }
-
- surf[0] = (BRW_SURFACE_2D << BRW_SURFACE_TYPE_SHIFT |
- format << BRW_SURFACE_FORMAT_SHIFT);
-
- /* reloc */
- assert(mt->offset % mt->cpp == 0);
- surf[1] = brw_state_reloc(&brw->batch, offset + 4, mt->bo,
- mt->offset +
- brw_renderbuffer_get_tile_offsets(irb,
- &tile_x,
- &tile_y),
- RELOC_WRITE);
-
- surf[2] = ((rb->Width - 1) << BRW_SURFACE_WIDTH_SHIFT |
- (rb->Height - 1) << BRW_SURFACE_HEIGHT_SHIFT);
-
- surf[3] = (brw_get_surface_tiling_bits(mt->surf.tiling) |
- (mt->surf.row_pitch_B - 1) << BRW_SURFACE_PITCH_SHIFT);
-
- surf[4] = brw_get_surface_num_multisamples(mt->surf.samples);
-
- assert(devinfo->has_surface_tile_offset || (tile_x == 0 && tile_y == 0));
- /* Note that the low bits of these fields are missing, so
- * there's the possibility of getting in trouble.
- */
- assert(tile_x % 4 == 0);
- assert(tile_y % 2 == 0);
- surf[5] = ((tile_x / 4) << BRW_SURFACE_X_OFFSET_SHIFT |
- (tile_y / 2) << BRW_SURFACE_Y_OFFSET_SHIFT |
- (mt->surf.image_alignment_el.height == 4 ?
- BRW_SURFACE_VERTICAL_ALIGN_ENABLE : 0));
-
- if (devinfo->ver < 6) {
- /* _NEW_COLOR */
- if (!ctx->Color.ColorLogicOpEnabled &&
- ctx->Color._AdvancedBlendMode == BLEND_NONE &&
- (ctx->Color.BlendEnabled & (1 << unit)))
- surf[0] |= BRW_SURFACE_BLEND_ENABLED;
-
- if (!GET_COLORMASK_BIT(ctx->Color.ColorMask, unit, 0))
- surf[0] |= 1 << BRW_SURFACE_WRITEDISABLE_R_SHIFT;
- if (!GET_COLORMASK_BIT(ctx->Color.ColorMask, unit, 1))
- surf[0] |= 1 << BRW_SURFACE_WRITEDISABLE_G_SHIFT;
- if (!GET_COLORMASK_BIT(ctx->Color.ColorMask, unit, 2))
- surf[0] |= 1 << BRW_SURFACE_WRITEDISABLE_B_SHIFT;
-
- /* As mentioned above, disable writes to the alpha component when the
- * renderbuffer is XRGB.
- */
- if (ctx->DrawBuffer->Visual.alphaBits == 0 ||
- !GET_COLORMASK_BIT(ctx->Color.ColorMask, unit, 3)) {
- surf[0] |= 1 << BRW_SURFACE_WRITEDISABLE_A_SHIFT;
- }
- }
-
- return offset;
-}
-
-static void
-update_renderbuffer_surfaces(struct brw_context *brw)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- const struct gl_context *ctx = &brw->ctx;
-
- /* _NEW_BUFFERS | _NEW_COLOR */
- const struct gl_framebuffer *fb = ctx->DrawBuffer;
-
- /* Render targets always start at binding table index 0. */
- const unsigned rt_start = 0;
-
- uint32_t *surf_offsets = brw->wm.base.surf_offset;
-
- /* Update surfaces for drawing buffers */
- if (fb->_NumColorDrawBuffers >= 1) {
- for (unsigned i = 0; i < fb->_NumColorDrawBuffers; i++) {
- struct gl_renderbuffer *rb = fb->_ColorDrawBuffers[i];
-
- if (brw_renderbuffer(rb)) {
- surf_offsets[rt_start + i] = devinfo->ver >= 6 ?
- gfx6_update_renderbuffer_surface(brw, rb, i, rt_start + i) :
- gfx4_update_renderbuffer_surface(brw, rb, i, rt_start + i);
- } else {
- emit_null_surface_state(brw, fb, &surf_offsets[rt_start + i]);
- }
- }
- } else {
- emit_null_surface_state(brw, fb, &surf_offsets[rt_start]);
- }
-
- /* The PIPE_CONTROL command description says:
- *
- * "Whenever a Binding Table Index (BTI) used by a Render Taget Message
- * points to a different RENDER_SURFACE_STATE, SW must issue a Render
- * Target Cache Flush by enabling this bit. When render target flush
- * is set due to new association of BTI, PS Scoreboard Stall bit must
- * be set in this packet."
- */
- if (devinfo->ver >= 11) {
- brw_emit_pipe_control_flush(brw,
- PIPE_CONTROL_RENDER_TARGET_FLUSH |
- PIPE_CONTROL_STALL_AT_SCOREBOARD);
- }
-
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
-}
-
-const struct brw_tracked_state brw_renderbuffer_surfaces = {
- .dirty = {
- .mesa = _NEW_BUFFERS |
- _NEW_COLOR,
- .brw = BRW_NEW_BATCH,
- },
- .emit = update_renderbuffer_surfaces,
-};
-
-const struct brw_tracked_state gfx6_renderbuffer_surfaces = {
- .dirty = {
- .mesa = _NEW_BUFFERS,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_AUX_STATE,
- },
- .emit = update_renderbuffer_surfaces,
-};
-
-static void
-update_renderbuffer_read_surfaces(struct brw_context *brw)
-{
- const struct gl_context *ctx = &brw->ctx;
-
- /* BRW_NEW_FS_PROG_DATA */
- const struct brw_wm_prog_data *wm_prog_data =
- brw_wm_prog_data(brw->wm.base.prog_data);
-
- if (wm_prog_data->has_render_target_reads &&
- !ctx->Extensions.EXT_shader_framebuffer_fetch) {
- /* _NEW_BUFFERS */
- const struct gl_framebuffer *fb = ctx->DrawBuffer;
-
- for (unsigned i = 0; i < fb->_NumColorDrawBuffers; i++) {
- struct gl_renderbuffer *rb = fb->_ColorDrawBuffers[i];
- const struct brw_renderbuffer *irb = brw_renderbuffer(rb);
- const unsigned surf_index =
- wm_prog_data->binding_table.render_target_read_start + i;
- uint32_t *surf_offset = &brw->wm.base.surf_offset[surf_index];
-
- if (irb) {
- const enum isl_format format = brw->mesa_to_isl_render_format[
- _mesa_get_render_format(ctx, brw_rb_format(irb))];
- assert(isl_format_supports_sampling(&brw->screen->devinfo,
- format));
-
- /* Override the target of the texture if the render buffer is a
- * single slice of a 3D texture (since the minimum array element
- * field of the surface state structure is ignored by the sampler
- * unit for 3D textures on some hardware), or if the render buffer
- * is a 1D array (since shaders always provide the array index
- * coordinate at the Z component to avoid state-dependent
- * recompiles when changing the texture target of the
- * framebuffer).
- */
- const GLenum target =
- (irb->mt->target == GL_TEXTURE_3D &&
- irb->layer_count == 1) ? GL_TEXTURE_2D :
- irb->mt->target == GL_TEXTURE_1D_ARRAY ? GL_TEXTURE_2D_ARRAY :
- irb->mt->target;
-
- const struct isl_view view = {
- .format = format,
- .base_level = irb->mt_level - irb->mt->first_level,
- .levels = 1,
- .base_array_layer = irb->mt_layer,
- .array_len = irb->layer_count,
- .swizzle = ISL_SWIZZLE_IDENTITY,
- .usage = ISL_SURF_USAGE_TEXTURE_BIT,
- };
-
- enum isl_aux_usage aux_usage =
- brw_miptree_texture_aux_usage(brw, irb->mt, format,
- brw->gfx9_astc5x5_wa_tex_mask);
- if (brw->draw_aux_usage[i] == ISL_AUX_USAGE_NONE)
- aux_usage = ISL_AUX_USAGE_NONE;
-
- brw_emit_surface_state(brw, irb->mt, target, view, aux_usage,
- surf_offset, surf_index,
- 0);
-
- } else {
- emit_null_surface_state(brw, fb, surf_offset);
- }
- }
-
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
- }
-}
-
-const struct brw_tracked_state brw_renderbuffer_read_surfaces = {
- .dirty = {
- .mesa = _NEW_BUFFERS,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_AUX_STATE |
- BRW_NEW_FS_PROG_DATA,
- },
- .emit = update_renderbuffer_read_surfaces,
-};
-
-static bool
-is_depth_texture(struct brw_texture_object *iobj)
-{
- GLenum base_format = _mesa_get_format_base_format(iobj->_Format);
- return base_format == GL_DEPTH_COMPONENT ||
- (base_format == GL_DEPTH_STENCIL && !iobj->base.StencilSampling);
-}
-
-static void
-update_stage_texture_surfaces(struct brw_context *brw,
- const struct gl_program *prog,
- struct brw_stage_state *stage_state,
- bool for_gather, uint32_t plane)
-{
- if (!prog)
- return;
-
- struct gl_context *ctx = &brw->ctx;
-
- uint32_t *surf_offset = stage_state->surf_offset;
-
- /* BRW_NEW_*_PROG_DATA */
- if (for_gather)
- surf_offset += stage_state->prog_data->binding_table.gather_texture_start;
- else
- surf_offset += stage_state->prog_data->binding_table.plane_start[plane];
-
- unsigned num_samplers = BITSET_LAST_BIT(prog->info.textures_used);
- for (unsigned s = 0; s < num_samplers; s++) {
- surf_offset[s] = 0;
-
- if (BITSET_TEST(prog->info.textures_used, s)) {
- const unsigned unit = prog->SamplerUnits[s];
- const bool used_by_txf = BITSET_TEST(prog->info.textures_used_by_txf, s);
- struct gl_texture_object *obj = ctx->Texture.Unit[unit]._Current;
- struct brw_texture_object *iobj = brw_texture_object(obj);
-
- /* _NEW_TEXTURE */
- if (!obj)
- continue;
-
- if ((prog->ShadowSamplers & (1 << s)) && !is_depth_texture(iobj)) {
- /* A programming note for the sample_c message says:
- *
- * "The Surface Format of the associated surface must be
- * indicated as supporting shadow mapping as indicated in the
- * surface format table."
- *
- * Accessing non-depth textures via a sampler*Shadow type is
- * undefined. GLSL 4.50 page 162 says:
- *
- * "If a shadow texture call is made to a sampler that does not
- * represent a depth texture, then results are undefined."
- *
- * We give them a null surface (zeros) for undefined. We've seen
- * GPU hangs with color buffers and sample_c, so we try and avoid
- * those with this hack.
- */
- emit_null_surface_state(brw, NULL, surf_offset + s);
- } else {
- brw_update_texture_surface(ctx, unit, surf_offset + s, for_gather,
- used_by_txf, plane);
- }
- }
- }
-}
-
-
-/**
- * Construct SURFACE_STATE objects for enabled textures.
- */
-static void
-brw_update_texture_surfaces(struct brw_context *brw)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
-
- /* BRW_NEW_VERTEX_PROGRAM */
- struct gl_program *vs = brw->programs[MESA_SHADER_VERTEX];
-
- /* BRW_NEW_TESS_PROGRAMS */
- struct gl_program *tcs = brw->programs[MESA_SHADER_TESS_CTRL];
- struct gl_program *tes = brw->programs[MESA_SHADER_TESS_EVAL];
-
- /* BRW_NEW_GEOMETRY_PROGRAM */
- struct gl_program *gs = brw->programs[MESA_SHADER_GEOMETRY];
-
- /* BRW_NEW_FRAGMENT_PROGRAM */
- struct gl_program *fs = brw->programs[MESA_SHADER_FRAGMENT];
-
- /* _NEW_TEXTURE */
- update_stage_texture_surfaces(brw, vs, &brw->vs.base, false, 0);
- update_stage_texture_surfaces(brw, tcs, &brw->tcs.base, false, 0);
- update_stage_texture_surfaces(brw, tes, &brw->tes.base, false, 0);
- update_stage_texture_surfaces(brw, gs, &brw->gs.base, false, 0);
- update_stage_texture_surfaces(brw, fs, &brw->wm.base, false, 0);
-
- /* emit alternate set of surface state for gather. this
- * allows the surface format to be overriden for only the
- * gather4 messages. */
- if (devinfo->ver < 8) {
- if (vs && vs->info.uses_texture_gather)
- update_stage_texture_surfaces(brw, vs, &brw->vs.base, true, 0);
- if (tcs && tcs->info.uses_texture_gather)
- update_stage_texture_surfaces(brw, tcs, &brw->tcs.base, true, 0);
- if (tes && tes->info.uses_texture_gather)
- update_stage_texture_surfaces(brw, tes, &brw->tes.base, true, 0);
- if (gs && gs->info.uses_texture_gather)
- update_stage_texture_surfaces(brw, gs, &brw->gs.base, true, 0);
- if (fs && fs->info.uses_texture_gather)
- update_stage_texture_surfaces(brw, fs, &brw->wm.base, true, 0);
- }
-
- if (fs) {
- update_stage_texture_surfaces(brw, fs, &brw->wm.base, false, 1);
- update_stage_texture_surfaces(brw, fs, &brw->wm.base, false, 2);
- }
-
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
-}
-
-const struct brw_tracked_state brw_texture_surfaces = {
- .dirty = {
- .mesa = _NEW_TEXTURE,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_AUX_STATE |
- BRW_NEW_FRAGMENT_PROGRAM |
- BRW_NEW_FS_PROG_DATA |
- BRW_NEW_GEOMETRY_PROGRAM |
- BRW_NEW_GS_PROG_DATA |
- BRW_NEW_TESS_PROGRAMS |
- BRW_NEW_TCS_PROG_DATA |
- BRW_NEW_TES_PROG_DATA |
- BRW_NEW_TEXTURE_BUFFER |
- BRW_NEW_VERTEX_PROGRAM |
- BRW_NEW_VS_PROG_DATA,
- },
- .emit = brw_update_texture_surfaces,
-};
-
-static void
-brw_update_cs_texture_surfaces(struct brw_context *brw)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
-
- /* BRW_NEW_COMPUTE_PROGRAM */
- struct gl_program *cs = brw->programs[MESA_SHADER_COMPUTE];
-
- /* _NEW_TEXTURE */
- update_stage_texture_surfaces(brw, cs, &brw->cs.base, false, 0);
-
- /* emit alternate set of surface state for gather. this
- * allows the surface format to be overriden for only the
- * gather4 messages.
- */
- if (devinfo->ver < 8) {
- if (cs && cs->info.uses_texture_gather)
- update_stage_texture_surfaces(brw, cs, &brw->cs.base, true, 0);
- }
-
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
-}
-
-const struct brw_tracked_state brw_cs_texture_surfaces = {
- .dirty = {
- .mesa = _NEW_TEXTURE,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_COMPUTE_PROGRAM |
- BRW_NEW_AUX_STATE,
- },
- .emit = brw_update_cs_texture_surfaces,
-};
-
-static void
-upload_buffer_surface(struct brw_context *brw,
- struct gl_buffer_binding *binding,
- uint32_t *out_offset,
- enum isl_format format,
- unsigned reloc_flags)
-{
- if (!binding->BufferObject) {
- emit_null_surface_state(brw, NULL, out_offset);
- } else {
- ptrdiff_t size = binding->BufferObject->Size - binding->Offset;
- if (!binding->AutomaticSize)
- size = MIN2(size, binding->Size);
-
- if (size == 0) {
- emit_null_surface_state(brw, NULL, out_offset);
- return;
- }
-
- struct brw_buffer_object *iobj =
- brw_buffer_object(binding->BufferObject);
- struct brw_bo *bo =
- brw_bufferobj_buffer(brw, iobj, binding->Offset, size,
- (reloc_flags & RELOC_WRITE) != 0);
-
- brw_emit_buffer_surface_state(brw, out_offset, bo, binding->Offset,
- format, size, 1, reloc_flags);
- }
-}
-
-void
-brw_upload_ubo_surfaces(struct brw_context *brw, struct gl_program *prog,
- struct brw_stage_state *stage_state,
- struct brw_stage_prog_data *prog_data)
-{
- struct gl_context *ctx = &brw->ctx;
-
- if (!prog || (prog->info.num_ubos == 0 &&
- prog->info.num_ssbos == 0 &&
- prog->info.num_abos == 0))
- return;
-
- if (prog->info.num_ubos) {
- assert(prog_data->binding_table.ubo_start < BRW_MAX_SURFACES);
- uint32_t *ubo_surf_offsets =
- &stage_state->surf_offset[prog_data->binding_table.ubo_start];
-
- for (int i = 0; i < prog->info.num_ubos; i++) {
- struct gl_buffer_binding *binding =
- &ctx->UniformBufferBindings[prog->sh.UniformBlocks[i]->Binding];
- upload_buffer_surface(brw, binding, &ubo_surf_offsets[i],
- ISL_FORMAT_R32G32B32A32_FLOAT, 0);
- }
- }
-
- if (prog->info.num_ssbos || prog->info.num_abos) {
- assert(prog_data->binding_table.ssbo_start < BRW_MAX_SURFACES);
- uint32_t *ssbo_surf_offsets =
- &stage_state->surf_offset[prog_data->binding_table.ssbo_start];
- uint32_t *abo_surf_offsets = ssbo_surf_offsets + prog->info.num_ssbos;
-
- for (int i = 0; i < prog->info.num_abos; i++) {
- struct gl_buffer_binding *binding =
- &ctx->AtomicBufferBindings[prog->sh.AtomicBuffers[i]->Binding];
- upload_buffer_surface(brw, binding, &abo_surf_offsets[i],
- ISL_FORMAT_RAW, RELOC_WRITE);
- }
-
- for (int i = 0; i < prog->info.num_ssbos; i++) {
- struct gl_buffer_binding *binding =
- &ctx->ShaderStorageBufferBindings[prog->sh.ShaderStorageBlocks[i]->Binding];
-
- upload_buffer_surface(brw, binding, &ssbo_surf_offsets[i],
- ISL_FORMAT_RAW, RELOC_WRITE);
- }
- }
-
- stage_state->push_constants_dirty = true;
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
-}
-
-static void
-brw_upload_wm_ubo_surfaces(struct brw_context *brw)
-{
- struct gl_context *ctx = &brw->ctx;
- /* _NEW_PROGRAM */
- struct gl_program *prog = ctx->FragmentProgram._Current;
-
- /* BRW_NEW_FS_PROG_DATA */
- brw_upload_ubo_surfaces(brw, prog, &brw->wm.base, brw->wm.base.prog_data);
-}
-
-const struct brw_tracked_state brw_wm_ubo_surfaces = {
- .dirty = {
- .mesa = _NEW_PROGRAM,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_FS_PROG_DATA |
- BRW_NEW_UNIFORM_BUFFER,
- },
- .emit = brw_upload_wm_ubo_surfaces,
-};
-
-static void
-brw_upload_cs_ubo_surfaces(struct brw_context *brw)
-{
- struct gl_context *ctx = &brw->ctx;
- /* _NEW_PROGRAM */
- struct gl_program *prog =
- ctx->_Shader->CurrentProgram[MESA_SHADER_COMPUTE];
-
- /* BRW_NEW_CS_PROG_DATA */
- brw_upload_ubo_surfaces(brw, prog, &brw->cs.base, brw->cs.base.prog_data);
-}
-
-const struct brw_tracked_state brw_cs_ubo_surfaces = {
- .dirty = {
- .mesa = _NEW_PROGRAM,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_CS_PROG_DATA |
- BRW_NEW_UNIFORM_BUFFER,
- },
- .emit = brw_upload_cs_ubo_surfaces,
-};
-
-static void
-brw_upload_cs_image_surfaces(struct brw_context *brw)
-{
- /* _NEW_PROGRAM */
- const struct gl_program *cp = brw->programs[MESA_SHADER_COMPUTE];
-
- if (cp) {
- /* BRW_NEW_CS_PROG_DATA, BRW_NEW_IMAGE_UNITS, _NEW_TEXTURE */
- brw_upload_image_surfaces(brw, cp, &brw->cs.base,
- brw->cs.base.prog_data);
- }
-}
-
-const struct brw_tracked_state brw_cs_image_surfaces = {
- .dirty = {
- .mesa = _NEW_TEXTURE | _NEW_PROGRAM,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_CS_PROG_DATA |
- BRW_NEW_AUX_STATE |
- BRW_NEW_IMAGE_UNITS
- },
- .emit = brw_upload_cs_image_surfaces,
-};
-
-static uint32_t
-get_image_format(struct brw_context *brw, mesa_format format, GLenum access)
-{
- const struct intel_device_info *devinfo = &brw->screen->devinfo;
- enum isl_format hw_format = brw_isl_format_for_mesa_format(format);
- if (access == GL_WRITE_ONLY || access == GL_NONE) {
- return hw_format;
- } else if (isl_has_matching_typed_storage_image_format(devinfo, hw_format)) {
- /* Typed surface reads support a very limited subset of the shader
- * image formats. Translate it into the closest format the
- * hardware supports.
- */
- return isl_lower_storage_image_format(devinfo, hw_format);
- } else {
- /* The hardware doesn't actually support a typed format that we can use
- * so we have to fall back to untyped read/write messages.
- */
- return ISL_FORMAT_RAW;
- }
-}
-
-static void
-update_default_image_param(struct brw_context *brw,
- struct gl_image_unit *u,
- struct brw_image_param *param)
-{
- memset(param, 0, sizeof(*param));
- /* Set the swizzling shifts to all-ones to effectively disable swizzling --
- * See emit_address_calculation() in brw_fs_surface_builder.cpp for a more
- * detailed explanation of these parameters.
- */
- param->swizzling[0] = 0xff;
- param->swizzling[1] = 0xff;
-}
-
-static void
-update_buffer_image_param(struct brw_context *brw,
- struct gl_image_unit *u,
- struct brw_image_param *param)
-{
- const unsigned size = buffer_texture_range_size(brw, u->TexObj);
- update_default_image_param(brw, u, param);
-
- param->size[0] = size / _mesa_get_format_bytes(u->_ActualFormat);
- param->stride[0] = _mesa_get_format_bytes(u->_ActualFormat);
-}
-
-static void
-update_image_surface(struct brw_context *brw,
- struct gl_image_unit *u,
- GLenum access,
- uint32_t *surf_offset,
- struct brw_image_param *param)
-{
- if (_mesa_is_image_unit_valid(&brw->ctx, u)) {
- struct gl_texture_object *obj = u->TexObj;
- const unsigned format = get_image_format(brw, u->_ActualFormat, access);
- const bool written = (access != GL_READ_ONLY && access != GL_NONE);
-
- if (obj->Target == GL_TEXTURE_BUFFER) {
- const unsigned texel_size = (format == ISL_FORMAT_RAW ? 1 :
- _mesa_get_format_bytes(u->_ActualFormat));
- const unsigned buffer_size = buffer_texture_range_size(brw, obj);
- struct brw_bo *const bo = !obj->BufferObject ? NULL :
- brw_bufferobj_buffer(brw, brw_buffer_object(obj->BufferObject),
- obj->BufferOffset, buffer_size, written);
-
- brw_emit_buffer_surface_state(
- brw, surf_offset, bo, obj->BufferOffset,
- format, buffer_size, texel_size,
- written ? RELOC_WRITE : 0);
-
- update_buffer_image_param(brw, u, param);
-
- } else {
- struct brw_texture_object *intel_obj = brw_texture_object(obj);
- struct brw_mipmap_tree *mt = intel_obj->mt;
-
- unsigned base_layer, num_layers;
- if (u->Layered) {
- if (obj->Target == GL_TEXTURE_3D) {
- base_layer = 0;
- num_layers = minify(mt->surf.logical_level0_px.depth, u->Level);
- } else {
- assert(obj->Immutable || obj->Attrib.MinLayer == 0);
- base_layer = obj->Attrib.MinLayer;
- num_layers = obj->Immutable ?
- obj->Attrib.NumLayers :
- mt->surf.logical_level0_px.array_len;
- }
- } else {
- base_layer = obj->Attrib.MinLayer + u->_Layer;
- num_layers = 1;
- }
-
- struct isl_view view = {
- .format = format,
- .base_level = obj->Attrib.MinLevel + u->Level,
- .levels = 1,
- .base_array_layer = base_layer,
- .array_len = num_layers,
- .swizzle = ISL_SWIZZLE_IDENTITY,
- .usage = ISL_SURF_USAGE_STORAGE_BIT,
- };
-
- if (format == ISL_FORMAT_RAW) {
- brw_emit_buffer_surface_state(
- brw, surf_offset, mt->bo, mt->offset,
- format, mt->bo->size - mt->offset, 1 /* pitch */,
- written ? RELOC_WRITE : 0);
-
- } else {
- const int surf_index = surf_offset - &brw->wm.base.surf_offset[0];
- assert(!brw_miptree_has_color_unresolved(mt,
- view.base_level, 1,
- view.base_array_layer,
- view.array_len));
- brw_emit_surface_state(brw, mt, mt->target, view,
- ISL_AUX_USAGE_NONE,
- surf_offset, surf_index,
- written ? RELOC_WRITE : 0);
- }
-
- isl_surf_fill_image_param(&brw->isl_dev, param, &mt->surf, &view);
- }
-
- } else {
- emit_null_surface_state(brw, NULL, surf_offset);
- update_default_image_param(brw, u, param);
- }
-}
-
-void
-brw_upload_image_surfaces(struct brw_context *brw,
- const struct gl_program *prog,
- struct brw_stage_state *stage_state,
- struct brw_stage_prog_data *prog_data)
-{
- assert(prog);
- struct gl_context *ctx = &brw->ctx;
-
- if (prog->info.num_images) {
- for (unsigned i = 0; i < prog->info.num_images; i++) {
- struct gl_image_unit *u = &ctx->ImageUnits[prog->sh.ImageUnits[i]];
- const unsigned surf_idx = prog_data->binding_table.image_start + i;
-
- update_image_surface(brw, u, prog->sh.ImageAccess[i],
- &stage_state->surf_offset[surf_idx],
- &stage_state->image_param[i]);
- }
-
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
- /* This may have changed the image metadata dependent on the context
- * image unit state and passed to the program as uniforms, make sure
- * that push and pull constants are reuploaded.
- */
- brw->NewGLState |= _NEW_PROGRAM_CONSTANTS;
- }
-}
-
-static void
-brw_upload_wm_image_surfaces(struct brw_context *brw)
-{
- /* BRW_NEW_FRAGMENT_PROGRAM */
- const struct gl_program *wm = brw->programs[MESA_SHADER_FRAGMENT];
-
- if (wm) {
- /* BRW_NEW_FS_PROG_DATA, BRW_NEW_IMAGE_UNITS, _NEW_TEXTURE */
- brw_upload_image_surfaces(brw, wm, &brw->wm.base,
- brw->wm.base.prog_data);
- }
-}
-
-const struct brw_tracked_state brw_wm_image_surfaces = {
- .dirty = {
- .mesa = _NEW_TEXTURE,
- .brw = BRW_NEW_BATCH |
- BRW_NEW_AUX_STATE |
- BRW_NEW_FRAGMENT_PROGRAM |
- BRW_NEW_FS_PROG_DATA |
- BRW_NEW_IMAGE_UNITS
- },
- .emit = brw_upload_wm_image_surfaces,
-};
-
-static void
-brw_upload_cs_work_groups_surface(struct brw_context *brw)
-{
- struct gl_context *ctx = &brw->ctx;
- /* _NEW_PROGRAM */
- struct gl_program *prog =
- ctx->_Shader->CurrentProgram[MESA_SHADER_COMPUTE];
- /* BRW_NEW_CS_PROG_DATA */
- const struct brw_cs_prog_data *cs_prog_data =
- brw_cs_prog_data(brw->cs.base.prog_data);
-
- if (prog && cs_prog_data->uses_num_work_groups) {
- const unsigned surf_idx =
- cs_prog_data->binding_table.work_groups_start;
- uint32_t *surf_offset = &brw->cs.base.surf_offset[surf_idx];
- struct brw_bo *bo;
- uint32_t bo_offset;
-
- if (brw->compute.num_work_groups_bo == NULL) {
- bo = NULL;
- brw_upload_data(&brw->upload,
- (void *)brw->compute.num_work_groups,
- 3 * sizeof(GLuint),
- sizeof(GLuint),
- &bo,
- &bo_offset);
- } else {
- bo = brw->compute.num_work_groups_bo;
- bo_offset = brw->compute.num_work_groups_offset;
- }
-
- brw_emit_buffer_surface_state(brw, surf_offset,
- bo, bo_offset,
- ISL_FORMAT_RAW,
- 3 * sizeof(GLuint), 1,
- RELOC_WRITE);
-
- /* The state buffer now holds a reference to our upload, drop ours. */
- if (bo != brw->compute.num_work_groups_bo)
- brw_bo_unreference(bo);
-
- brw->ctx.NewDriverState |= BRW_NEW_SURFACES;
- }
-}
-
-const struct brw_tracked_state brw_cs_work_groups_surface = {
- .dirty = {
- .brw = BRW_NEW_CS_PROG_DATA |
- BRW_NEW_CS_WORK_GROUPS
- },
- .emit = brw_upload_cs_work_groups_surface,
-};