i965: Port INTEL_PRECISE_TRIG=1 to NIR.

This makes the extra multiply visible to NIR's algebraic optimizations (for constant reassociation) as well as constant folding. This means that when the result of sin/cos are multiplied by an constant, we can eliminate the extra multiply altogether, reducing the cost of the workaround. It also means we only have to implement it one place, rather than in both backends. This makes INTEL_PRECISE_TRIG=1 cost nothing on GPUTest/Volplosion, which has a ton of sin() calls, but always multiplies them by an immediate constant. The extra multiply gets folded away. Signed-off-by: Kenneth Graunke <kenneth@whitecape.org> Reviewed-by: Eduardo Lima Mitev <elima@igalia.com> Reviewed-by: Jason Ekstrand <jason@jlekstrand.net> Reviewed-by: Matt Turner <mattst88@gmail.com>
author: Kenneth Graunke <kenneth@whitecape.org> 2016-04-07 15:04:35 -0700
committer: Kenneth Graunke <kenneth@whitecape.org> 2016-04-11 18:44:17 -0700
commit: bfd17c76c1267756ea16051cbe174cb23ff49f44 (patch)
tree: b451c81beb61d850f0f726fc8437e81384cb39ee /src/mesa/drivers/dri/i965/brw_vec4_nir.cpp
parent: b0dffdc616801a1fd8534502e11ac840369041ab (diff)
download: external_mesa3d-bfd17c76c1267756ea16051cbe174cb23ff49f44.zip
external_mesa3d-bfd17c76c1267756ea16051cbe174cb23ff49f44.tar.gz
external_mesa3d-bfd17c76c1267756ea16051cbe174cb23ff49f44.tar.bz2
1 files changed, 2 insertions, 14 deletions
diff --git a/src/mesa/drivers/dri/i965/brw_vec4_nir.cpp b/src/mesa/drivers/dri/i965/brw_vec4_nir.cpp
index d9f96c5..e4e8c38 100644
--- a/src/mesa/drivers/dri/i965/brw_vec4_nir.cpp
+++ b/src/mesa/drivers/dri/i965/brw_vec4_nir.cpp
@@ -1101,24 +1101,12 @@ vec4_visitor::nir_emit_alu(nir_alu_instr *instr)
       break;
 
    case nir_op_fsin:
-      if (!compiler->precise_trig) {
-         inst = emit_math(SHADER_OPCODE_SIN, dst, op[0]);
-      } else {
-         src_reg tmp = src_reg(this, glsl_type::vec4_type);
-         inst = emit_math(SHADER_OPCODE_SIN, dst_reg(tmp), op[0]);
-         inst = emit(MUL(dst, tmp, brw_imm_f(0.99997)));
-      }
+      inst = emit_math(SHADER_OPCODE_SIN, dst, op[0]);
       inst->saturate = instr->dest.saturate;
       break;
 
    case nir_op_fcos:
-      if (!compiler->precise_trig) {
-         inst = emit_math(SHADER_OPCODE_COS, dst, op[0]);
-      } else {
-         src_reg tmp = src_reg(this, glsl_type::vec4_type);
-         inst = emit_math(SHADER_OPCODE_COS, dst_reg(tmp), op[0]);
-         inst = emit(MUL(dst, tmp, brw_imm_f(0.99997)));
-      }
+      inst = emit_math(SHADER_OPCODE_COS, dst, op[0]);
       inst->saturate = instr->dest.saturate;
       break;
author	Kenneth Graunke <kenneth@whitecape.org>	2016-04-07 15:04:35 -0700
committer	Kenneth Graunke <kenneth@whitecape.org>	2016-04-11 18:44:17 -0700
commit	bfd17c76c1267756ea16051cbe174cb23ff49f44 (patch)
tree	b451c81beb61d850f0f726fc8437e81384cb39ee /src/mesa/drivers/dri/i965/brw_vec4_nir.cpp
parent	b0dffdc616801a1fd8534502e11ac840369041ab (diff)
download	external_mesa3d-bfd17c76c1267756ea16051cbe174cb23ff49f44.zip external_mesa3d-bfd17c76c1267756ea16051cbe174cb23ff49f44.tar.gz external_mesa3d-bfd17c76c1267756ea16051cbe174cb23ff49f44.tar.bz2