summaryrefslogtreecommitdiff
path: root/src/compiler
diff options
context:
space:
mode:
authorCaio Marcelo de Oliveira Filho <caio.oliveira@intel.com>2021-05-05 12:24:44 -0700
committerCaio Marcelo de Oliveira Filho <caio.oliveira@intel.com>2021-06-08 09:23:55 -0700
commit8af6766062044167fb3b61950ddbc7d67e4c3e48 (patch)
tree9d74934c90d19501867bfdc53dfd318d7e221114 /src/compiler
parentb5f6fc442c1014e2e05f752d971a2276ae6cd13e (diff)
nir: Move workgroup_size and workgroup_variable_size into common shader_info
Move it out of the "cs" sub-struct, since these will be used for other shader stages in the future. Reviewed-by: Kenneth Graunke <kenneth@whitecape.org> Part-of: <https://gitlab.freedesktop.org/mesa/mesa/-/merge_requests/11225>
Diffstat (limited to 'src/compiler')
-rw-r--r--src/compiler/glsl/linker.cpp28
-rw-r--r--src/compiler/glsl/lower_cs_derived.cpp4
-rw-r--r--src/compiler/nir/nir_lower_system_values.c18
-rw-r--r--src/compiler/nir/nir_lower_variable_initializers.c8
-rw-r--r--src/compiler/nir/nir_opt_uniform_atomics.c9
-rw-r--r--src/compiler/nir/nir_print.c10
-rw-r--r--src/compiler/nir/nir_range_analysis.c26
-rw-r--r--src/compiler/shader_enums.h9
-rw-r--r--src/compiler/shader_info.h12
-rw-r--r--src/compiler/spirv/spirv_to_nir.c20
10 files changed, 81 insertions, 63 deletions
diff --git a/src/compiler/glsl/linker.cpp b/src/compiler/glsl/linker.cpp
index c67f4b0ff1e..df1bf920a76 100644
--- a/src/compiler/glsl/linker.cpp
+++ b/src/compiler/glsl/linker.cpp
@@ -2230,9 +2230,9 @@ link_cs_input_layout_qualifiers(struct gl_shader_program *prog,
return;
for (int i = 0; i < 3; i++)
- gl_prog->info.cs.workgroup_size[i] = 0;
+ gl_prog->info.workgroup_size[i] = 0;
- gl_prog->info.cs.workgroup_size_variable = false;
+ gl_prog->info.workgroup_size_variable = false;
gl_prog->info.cs.derivative_group = DERIVATIVE_GROUP_NONE;
@@ -2250,9 +2250,9 @@ link_cs_input_layout_qualifiers(struct gl_shader_program *prog,
struct gl_shader *shader = shader_list[sh];
if (shader->info.Comp.LocalSize[0] != 0) {
- if (gl_prog->info.cs.workgroup_size[0] != 0) {
+ if (gl_prog->info.workgroup_size[0] != 0) {
for (int i = 0; i < 3; i++) {
- if (gl_prog->info.cs.workgroup_size[i] !=
+ if (gl_prog->info.workgroup_size[i] !=
shader->info.Comp.LocalSize[i]) {
linker_error(prog, "compute shader defined with conflicting "
"local sizes\n");
@@ -2261,11 +2261,11 @@ link_cs_input_layout_qualifiers(struct gl_shader_program *prog,
}
}
for (int i = 0; i < 3; i++) {
- gl_prog->info.cs.workgroup_size[i] =
+ gl_prog->info.workgroup_size[i] =
shader->info.Comp.LocalSize[i];
}
} else if (shader->info.Comp.LocalSizeVariable) {
- if (gl_prog->info.cs.workgroup_size[0] != 0) {
+ if (gl_prog->info.workgroup_size[0] != 0) {
/* The ARB_compute_variable_group_size spec says:
*
* If one compute shader attached to a program declares a
@@ -2277,7 +2277,7 @@ link_cs_input_layout_qualifiers(struct gl_shader_program *prog,
"variable local group size\n");
return;
}
- gl_prog->info.cs.workgroup_size_variable = true;
+ gl_prog->info.workgroup_size_variable = true;
}
enum gl_derivative_group group = shader->info.Comp.DerivativeGroup;
@@ -2296,30 +2296,30 @@ link_cs_input_layout_qualifiers(struct gl_shader_program *prog,
* since we already know we're in the right type of shader program
* for doing it.
*/
- if (gl_prog->info.cs.workgroup_size[0] == 0 &&
- !gl_prog->info.cs.workgroup_size_variable) {
+ if (gl_prog->info.workgroup_size[0] == 0 &&
+ !gl_prog->info.workgroup_size_variable) {
linker_error(prog, "compute shader must contain a fixed or a variable "
"local group size\n");
return;
}
if (gl_prog->info.cs.derivative_group == DERIVATIVE_GROUP_QUADS) {
- if (gl_prog->info.cs.workgroup_size[0] % 2 != 0) {
+ if (gl_prog->info.workgroup_size[0] % 2 != 0) {
linker_error(prog, "derivative_group_quadsNV must be used with a "
"local group size whose first dimension "
"is a multiple of 2\n");
return;
}
- if (gl_prog->info.cs.workgroup_size[1] % 2 != 0) {
+ if (gl_prog->info.workgroup_size[1] % 2 != 0) {
linker_error(prog, "derivative_group_quadsNV must be used with a local"
"group size whose second dimension "
"is a multiple of 2\n");
return;
}
} else if (gl_prog->info.cs.derivative_group == DERIVATIVE_GROUP_LINEAR) {
- if ((gl_prog->info.cs.workgroup_size[0] *
- gl_prog->info.cs.workgroup_size[1] *
- gl_prog->info.cs.workgroup_size[2]) % 4 != 0) {
+ if ((gl_prog->info.workgroup_size[0] *
+ gl_prog->info.workgroup_size[1] *
+ gl_prog->info.workgroup_size[2]) % 4 != 0) {
linker_error(prog, "derivative_group_linearNV must be used with a "
"local group size whose total number of invocations "
"is a multiple of 4\n");
diff --git a/src/compiler/glsl/lower_cs_derived.cpp b/src/compiler/glsl/lower_cs_derived.cpp
index 99a0028fb6a..6faa99fad16 100644
--- a/src/compiler/glsl/lower_cs_derived.cpp
+++ b/src/compiler/glsl/lower_cs_derived.cpp
@@ -54,7 +54,7 @@ public:
explicit lower_cs_derived_visitor(gl_linked_shader *shader)
: progress(false),
shader(shader),
- local_size_variable(shader->Program->info.cs.workgroup_size_variable),
+ local_size_variable(shader->Program->info.workgroup_size_variable),
gl_WorkGroupSize(NULL),
gl_WorkGroupID(NULL),
gl_LocalInvocationID(NULL),
@@ -144,7 +144,7 @@ lower_cs_derived_visitor::find_sysvals()
ir_constant_data data;
memset(&data, 0, sizeof(data));
for (int i = 0; i < 3; i++)
- data.u[i] = shader->Program->info.cs.workgroup_size[i];
+ data.u[i] = shader->Program->info.workgroup_size[i];
gl_WorkGroupSize = new(shader) ir_constant(glsl_type::uvec3_type, &data);
}
}
diff --git a/src/compiler/nir/nir_lower_system_values.c b/src/compiler/nir/nir_lower_system_values.c
index 732b8e80a6b..60443050407 100644
--- a/src/compiler/nir/nir_lower_system_values.c
+++ b/src/compiler/nir/nir_lower_system_values.c
@@ -320,10 +320,10 @@ lower_compute_system_value_instr(nir_builder *b,
nir_ssa_def *x = nir_channel(b, ids, 0);
nir_ssa_def *y = nir_channel(b, ids, 1);
nir_ssa_def *z = nir_channel(b, ids, 2);
- unsigned size_x = b->shader->info.cs.workgroup_size[0];
+ unsigned size_x = b->shader->info.workgroup_size[0];
nir_ssa_def *size_x_imm;
- if (b->shader->info.cs.workgroup_size_variable)
+ if (b->shader->info.workgroup_size_variable)
size_x_imm = nir_channel(b, nir_load_workgroup_size(b), 0);
else
size_x_imm = nir_imm_int(b, size_x);
@@ -371,7 +371,7 @@ lower_compute_system_value_instr(nir_builder *b,
nir_ishl(b, x_bits_1n, one));
nir_ssa_def *i;
- if (!b->shader->info.cs.workgroup_size_variable &&
+ if (!b->shader->info.workgroup_size_variable &&
util_is_power_of_two_nonzero(size_x)) {
nir_ssa_def *log2_size_x = nir_imm_int(b, util_logbase2(size_x));
i = nir_ior(b, bits_01x, nir_ishl(b, y_bits_1n, log2_size_x));
@@ -405,9 +405,9 @@ lower_compute_system_value_instr(nir_builder *b,
nir_ssa_def *local_id = nir_load_local_invocation_id(b);
nir_ssa_def *size_x =
- nir_imm_int(b, b->shader->info.cs.workgroup_size[0]);
+ nir_imm_int(b, b->shader->info.workgroup_size[0]);
nir_ssa_def *size_y =
- nir_imm_int(b, b->shader->info.cs.workgroup_size[1]);
+ nir_imm_int(b, b->shader->info.workgroup_size[1]);
/* Because no hardware supports a local workgroup size greater than
* about 1K, this calculation can be done in 32-bit and can save some
@@ -425,7 +425,7 @@ lower_compute_system_value_instr(nir_builder *b,
}
case nir_intrinsic_load_workgroup_size:
- if (b->shader->info.cs.workgroup_size_variable) {
+ if (b->shader->info.workgroup_size_variable) {
/* If the local work group size is variable it can't be lowered at
* this point. We do, however, have to make sure that the intrinsic
* is only 32-bit.
@@ -436,9 +436,9 @@ lower_compute_system_value_instr(nir_builder *b,
* than 32 bits for the local size */
nir_const_value workgroup_size_const[3];
memset(workgroup_size_const, 0, sizeof(workgroup_size_const));
- workgroup_size_const[0].u32 = b->shader->info.cs.workgroup_size[0];
- workgroup_size_const[1].u32 = b->shader->info.cs.workgroup_size[1];
- workgroup_size_const[2].u32 = b->shader->info.cs.workgroup_size[2];
+ workgroup_size_const[0].u32 = b->shader->info.workgroup_size[0];
+ workgroup_size_const[1].u32 = b->shader->info.workgroup_size[1];
+ workgroup_size_const[2].u32 = b->shader->info.workgroup_size[2];
return nir_u2u(b, nir_build_imm(b, 3, 32, workgroup_size_const), bit_size);
}
diff --git a/src/compiler/nir/nir_lower_variable_initializers.c b/src/compiler/nir/nir_lower_variable_initializers.c
index b26624f8cf6..ba0e7ba7be6 100644
--- a/src/compiler/nir/nir_lower_variable_initializers.c
+++ b/src/compiler/nir/nir_lower_variable_initializers.c
@@ -154,10 +154,10 @@ nir_zero_initialize_shared_memory(nir_shader *shader,
nir_builder_init(&b, nir_shader_get_entrypoint(shader));
b.cursor = nir_before_cf_list(&b.impl->body);
- assert(!shader->info.cs.workgroup_size_variable);
- const unsigned local_count = shader->info.cs.workgroup_size[0] *
- shader->info.cs.workgroup_size[1] *
- shader->info.cs.workgroup_size[2];
+ assert(!shader->info.workgroup_size_variable);
+ const unsigned local_count = shader->info.workgroup_size[0] *
+ shader->info.workgroup_size[1] *
+ shader->info.workgroup_size[2];
/* The initialization logic is simplified if we can always split the memory
* in full chunk_size units.
diff --git a/src/compiler/nir/nir_opt_uniform_atomics.c b/src/compiler/nir/nir_opt_uniform_atomics.c
index 433803cb35e..2c64e3198a4 100644
--- a/src/compiler/nir/nir_opt_uniform_atomics.c
+++ b/src/compiler/nir/nir_opt_uniform_atomics.c
@@ -169,7 +169,7 @@ is_atomic_already_optimized(nir_shader *shader, nir_intrinsic_instr *instr)
unsigned dims_needed = 0;
for (unsigned i = 0; i < 3; i++)
- dims_needed |= (shader->info.cs.workgroup_size[i] > 1) << i;
+ dims_needed |= (shader->info.workgroup_size[i] > 1) << i;
return (dims & dims_needed) == dims_needed || dims & 0x8;
}
@@ -306,9 +306,10 @@ nir_opt_uniform_atomics(nir_shader *shader)
/* A 1x1x1 workgroup only ever has one active lane, so there's no point in
* optimizing any atomics.
*/
- if (shader->info.stage == MESA_SHADER_COMPUTE && !shader->info.cs.workgroup_size_variable &&
- shader->info.cs.workgroup_size[0] == 1 && shader->info.cs.workgroup_size[1] == 1 &&
- shader->info.cs.workgroup_size[2] == 1)
+ if (gl_shader_stage_uses_workgroup(shader->info.stage) &&
+ !shader->info.workgroup_size_variable &&
+ shader->info.workgroup_size[0] == 1 && shader->info.workgroup_size[1] == 1 &&
+ shader->info.workgroup_size[2] == 1)
return false;
nir_foreach_function(function, shader) {
diff --git a/src/compiler/nir/nir_print.c b/src/compiler/nir/nir_print.c
index 363a8e4aeb1..649d1de224d 100644
--- a/src/compiler/nir/nir_print.c
+++ b/src/compiler/nir/nir_print.c
@@ -1605,12 +1605,12 @@ nir_print_shader_annotated(nir_shader *shader, FILE *fp,
if (shader->info.label)
fprintf(fp, "label: %s\n", shader->info.label);
- if (gl_shader_stage_is_compute(shader->info.stage)) {
+ if (gl_shader_stage_uses_workgroup(shader->info.stage)) {
fprintf(fp, "workgroup-size: %u, %u, %u%s\n",
- shader->info.cs.workgroup_size[0],
- shader->info.cs.workgroup_size[1],
- shader->info.cs.workgroup_size[2],
- shader->info.cs.workgroup_size_variable ? " (variable)" : "");
+ shader->info.workgroup_size[0],
+ shader->info.workgroup_size[1],
+ shader->info.workgroup_size[2],
+ shader->info.workgroup_size_variable ? " (variable)" : "");
fprintf(fp, "shared-size: %u\n", shader->info.shared_size);
}
diff --git a/src/compiler/nir/nir_range_analysis.c b/src/compiler/nir/nir_range_analysis.c
index 18ac161d5e0..501084f14f5 100644
--- a/src/compiler/nir/nir_range_analysis.c
+++ b/src/compiler/nir/nir_range_analysis.c
@@ -1292,20 +1292,19 @@ nir_unsigned_upper_bound(nir_shader *shader, struct hash_table *range_ht,
nir_intrinsic_instr *intrin = nir_instr_as_intrinsic(scalar.def->parent_instr);
switch (intrin->intrinsic) {
case nir_intrinsic_load_local_invocation_index:
- if (shader->info.stage != MESA_SHADER_COMPUTE ||
- shader->info.cs.workgroup_size_variable) {
+ if (shader->info.workgroup_size_variable) {
res = config->max_workgroup_invocations - 1;
} else {
- res = (shader->info.cs.workgroup_size[0] *
- shader->info.cs.workgroup_size[1] *
- shader->info.cs.workgroup_size[2]) - 1u;
+ res = (shader->info.workgroup_size[0] *
+ shader->info.workgroup_size[1] *
+ shader->info.workgroup_size[2]) - 1u;
}
break;
case nir_intrinsic_load_local_invocation_id:
- if (shader->info.cs.workgroup_size_variable)
+ if (shader->info.workgroup_size_variable)
res = config->max_workgroup_size[scalar.comp] - 1u;
else
- res = shader->info.cs.workgroup_size[scalar.comp] - 1u;
+ res = shader->info.workgroup_size[scalar.comp] - 1u;
break;
case nir_intrinsic_load_workgroup_id:
res = config->max_workgroup_count[scalar.comp] - 1u;
@@ -1314,11 +1313,11 @@ nir_unsigned_upper_bound(nir_shader *shader, struct hash_table *range_ht,
res = config->max_workgroup_count[scalar.comp];
break;
case nir_intrinsic_load_global_invocation_id:
- if (shader->info.cs.workgroup_size_variable) {
+ if (shader->info.workgroup_size_variable) {
res = mul_clamp(config->max_workgroup_size[scalar.comp],
config->max_workgroup_count[scalar.comp]) - 1u;
} else {
- res = (shader->info.cs.workgroup_size[scalar.comp] *
+ res = (shader->info.workgroup_size[scalar.comp] *
config->max_workgroup_count[scalar.comp]) - 1u;
}
break;
@@ -1339,10 +1338,11 @@ nir_unsigned_upper_bound(nir_shader *shader, struct hash_table *range_ht,
case nir_intrinsic_load_subgroup_id:
case nir_intrinsic_load_num_subgroups: {
uint32_t workgroup_size = config->max_workgroup_invocations;
- if (shader->info.stage == MESA_SHADER_COMPUTE && !shader->info.cs.workgroup_size_variable) {
- workgroup_size = shader->info.cs.workgroup_size[0] *
- shader->info.cs.workgroup_size[1] *
- shader->info.cs.workgroup_size[2];
+ if (gl_shader_stage_uses_workgroup(shader->info.stage) &&
+ !shader->info.workgroup_size_variable) {
+ workgroup_size = shader->info.workgroup_size[0] *
+ shader->info.workgroup_size[1] *
+ shader->info.workgroup_size[2];
}
res = DIV_ROUND_UP(workgroup_size, config->min_subgroup_size);
if (intrin->intrinsic == nir_intrinsic_load_subgroup_id)
diff --git a/src/compiler/shader_enums.h b/src/compiler/shader_enums.h
index 9350459a100..2728c4417ed 100644
--- a/src/compiler/shader_enums.h
+++ b/src/compiler/shader_enums.h
@@ -73,6 +73,15 @@ gl_shader_stage_is_compute(gl_shader_stage stage)
}
static inline bool
+gl_shader_stage_uses_workgroup(gl_shader_stage stage)
+{
+ return stage == MESA_SHADER_COMPUTE ||
+ stage == MESA_SHADER_KERNEL ||
+ stage == MESA_SHADER_TASK ||
+ stage == MESA_SHADER_MESH;
+}
+
+static inline bool
gl_shader_stage_is_callable(gl_shader_stage stage)
{
return stage == MESA_SHADER_ANY_HIT ||
diff --git a/src/compiler/shader_info.h b/src/compiler/shader_info.h
index 7c18e565433..1bb2f8b966d 100644
--- a/src/compiler/shader_info.h
+++ b/src/compiler/shader_info.h
@@ -198,6 +198,11 @@ typedef struct shader_info {
*/
unsigned shared_size;
+ /**
+ * Local workgroup size used by compute/task/mesh shaders.
+ */
+ uint16_t workgroup_size[3];
+
uint16_t inlinable_uniform_dw_offsets[MAX_INLINABLE_UNIFORMS];
uint8_t num_inlinable_uniforms:4;
@@ -259,6 +264,11 @@ typedef struct shader_info {
*/
bool zero_initialize_shared_memory:1;
+ /**
+ * Used for ARB_compute_variable_group_size.
+ */
+ bool workgroup_size_variable:1;
+
union {
struct {
/* Which inputs are doubles */
@@ -389,10 +399,8 @@ typedef struct shader_info {
} fs;
struct {
- uint16_t workgroup_size[3];
uint16_t workgroup_size_hint[3];
- bool workgroup_size_variable:1;
uint8_t user_data_components_amd:3;
/*
diff --git a/src/compiler/spirv/spirv_to_nir.c b/src/compiler/spirv/spirv_to_nir.c
index d94577d23c8..2abf1144b01 100644
--- a/src/compiler/spirv/spirv_to_nir.c
+++ b/src/compiler/spirv/spirv_to_nir.c
@@ -4803,9 +4803,9 @@ vtn_handle_execution_mode(struct vtn_builder *b, struct vtn_value *entry_point,
case SpvExecutionModeLocalSize:
vtn_assert(gl_shader_stage_is_compute(b->shader->info.stage));
- b->shader->info.cs.workgroup_size[0] = mode->operands[0];
- b->shader->info.cs.workgroup_size[1] = mode->operands[1];
- b->shader->info.cs.workgroup_size[2] = mode->operands[2];
+ b->shader->info.workgroup_size[0] = mode->operands[0];
+ b->shader->info.workgroup_size[1] = mode->operands[1];
+ b->shader->info.workgroup_size[2] = mode->operands[2];
break;
case SpvExecutionModeOutputVertices:
@@ -5016,9 +5016,9 @@ vtn_handle_execution_mode_id(struct vtn_builder *b, struct vtn_value *entry_poin
switch (mode->exec_mode) {
case SpvExecutionModeLocalSizeId:
- b->shader->info.cs.workgroup_size[0] = vtn_constant_uint(b, mode->operands[0]);
- b->shader->info.cs.workgroup_size[1] = vtn_constant_uint(b, mode->operands[1]);
- b->shader->info.cs.workgroup_size[2] = vtn_constant_uint(b, mode->operands[2]);
+ b->shader->info.workgroup_size[0] = vtn_constant_uint(b, mode->operands[0]);
+ b->shader->info.workgroup_size[1] = vtn_constant_uint(b, mode->operands[1]);
+ b->shader->info.workgroup_size[2] = vtn_constant_uint(b, mode->operands[2]);
break;
case SpvExecutionModeLocalSizeHintId:
@@ -5986,16 +5986,16 @@ spirv_to_nir(const uint32_t *words, size_t word_count,
vtn_handle_execution_mode_id, NULL);
if (b->workgroup_size_builtin) {
- vtn_assert(stage == MESA_SHADER_COMPUTE || stage == MESA_SHADER_KERNEL);
+ vtn_assert(gl_shader_stage_uses_workgroup(stage));
vtn_assert(b->workgroup_size_builtin->type->type ==
glsl_vector_type(GLSL_TYPE_UINT, 3));
nir_const_value *const_size =
b->workgroup_size_builtin->constant->values;
- b->shader->info.cs.workgroup_size[0] = const_size[0].u32;
- b->shader->info.cs.workgroup_size[1] = const_size[1].u32;
- b->shader->info.cs.workgroup_size[2] = const_size[2].u32;
+ b->shader->info.workgroup_size[0] = const_size[0].u32;
+ b->shader->info.workgroup_size[1] = const_size[1].u32;
+ b->shader->info.workgroup_size[2] = const_size[2].u32;
}
/* Set types on all vtn_values */