i965/fs: Rework the persample shading key/prog_data bits

This commit reworks and simplifies the way we handle persample shading in the shader key and prog_data. The previous approach had three different key bits that had slightly different and hard-to-discern meanings while the new bits are far more clear. This commit changes it to two easily understood bits that communicate everything we need: 1) key->persample_interp: means that the user has requested persample interpolation through the API. This is equivalent to having SAMPLE_SHADING enabled and having MIN_SAMPLE_SHADING_VALUE set high enough that you actually get multiple per-sample invocations. 2) key->multisample_fbo: means that the shader will be running on an actual multi-sampled framebuffer. This commit also adds a new "persample_dispatch" bit to prog_data which indicates that the shader should be run in persample mode. This way the state setup code doesn't have to look at the fragment program or GL state and can just pull that data out of the prog_data. In theory, this shuffle could mean more recompiles. However, in practice, we were shoving enough state into the key before that we were probably hitting a recompile on every per-sample shader anyway. Reviewed-by: Kenneth Graunke <kenneth@whitecape.org>
author: Jason Ekstrand <jason.ekstrand@intel.com> 2016-05-09 17:48:24 -0700
committer: Jason Ekstrand <jason.ekstrand@intel.com> 2016-05-14 13:34:05 -0700
commit: 712a980adde0b14eee8b4accd02af9b9740091a2 (patch)
tree: 7bb3fbc03b59eb51c491013c8bcf29bd2b7e0f8b /src/mesa/drivers/dri/i965/gen7_wm_state.c
parent: a2f50d87b6e9d07c6974ef309cc99acf56b2dc09 (diff)
download: external_mesa3d-712a980adde0b14eee8b4accd02af9b9740091a2.zip
external_mesa3d-712a980adde0b14eee8b4accd02af9b9740091a2.tar.gz
external_mesa3d-712a980adde0b14eee8b4accd02af9b9740091a2.tar.bz2
1 files changed, 8 insertions, 12 deletions
diff --git a/src/mesa/drivers/dri/i965/gen7_wm_state.c b/src/mesa/drivers/dri/i965/gen7_wm_state.c
index 2c3930f..945fbbd 100644
--- a/src/mesa/drivers/dri/i965/gen7_wm_state.c
+++ b/src/mesa/drivers/dri/i965/gen7_wm_state.c
@@ -91,7 +91,7 @@ upload_wm_state(struct brw_context *brw)
       else
          dw1 |= GEN7_WM_MSRAST_OFF_PIXEL;
 
-      if (_mesa_get_min_invocations_per_fragment(ctx, brw->fragment_program, false) > 1)
+      if (prog_data->persample_dispatch)
          dw2 |= GEN7_WM_MSDISPMODE_PERSAMPLE;
       else
          dw2 |= GEN7_WM_MSDISPMODE_PERPIXEL;
@@ -152,7 +152,6 @@ gen7_upload_ps_state(struct brw_context *brw,
                      bool enable_dual_src_blend, unsigned sample_mask,
                      unsigned fast_clear_op)
 {
-   struct gl_context *ctx = &brw->ctx;
    uint32_t dw2, dw4, dw5, ksp0, ksp2;
    const int max_threads_shift = brw->is_haswell ?
       HSW_PS_MAX_THREADS_SHIFT : IVB_PS_MAX_THREADS_SHIFT;
@@ -216,18 +215,15 @@ gen7_upload_ps_state(struct brw_context *brw,
    if (prog_data->num_varying_inputs != 0)
       dw4 |= GEN7_PS_ATTRIBUTE_ENABLE;
 
-   /* In case of non 1x per sample shading, only one of SIMD8 and SIMD16
-    * should be enabled. We do 'SIMD16 only' dispatch if a SIMD16 shader
-    * is successfully compiled. In majority of the cases that bring us
-    * better performance than 'SIMD8 only' dispatch.
-    */
-   int min_inv_per_frag =
-      _mesa_get_min_invocations_per_fragment(ctx, fp, false);
-   assert(min_inv_per_frag >= 1);
-
    if (prog_data->prog_offset_16 || prog_data->no_8) {
       dw4 |= GEN7_PS_16_DISPATCH_ENABLE;
-      if (!prog_data->no_8 && min_inv_per_frag == 1) {
+
+      /* In case of non 1x per sample shading, only one of SIMD8 and SIMD16
+       * should be enabled. We do 'SIMD16 only' dispatch if a SIMD16 shader
+       * is successfully compiled. In majority of the cases that bring us
+       * better performance than 'SIMD8 only' dispatch.
+       */
+      if (!prog_data->no_8 && !prog_data->persample_dispatch) {
          dw4 |= GEN7_PS_8_DISPATCH_ENABLE;
          dw5 |= (prog_data->base.dispatch_grf_start_reg <<
                  GEN7_PS_DISPATCH_START_GRF_SHIFT_0);
author	Jason Ekstrand <jason.ekstrand@intel.com>	2016-05-09 17:48:24 -0700
committer	Jason Ekstrand <jason.ekstrand@intel.com>	2016-05-14 13:34:05 -0700
commit	712a980adde0b14eee8b4accd02af9b9740091a2 (patch)
tree	7bb3fbc03b59eb51c491013c8bcf29bd2b7e0f8b /src/mesa/drivers/dri/i965/gen7_wm_state.c
parent	a2f50d87b6e9d07c6974ef309cc99acf56b2dc09 (diff)
download	external_mesa3d-712a980adde0b14eee8b4accd02af9b9740091a2.zip external_mesa3d-712a980adde0b14eee8b4accd02af9b9740091a2.tar.gz external_mesa3d-712a980adde0b14eee8b4accd02af9b9740091a2.tar.bz2