diff options
author | Iago Toral Quiroga <itoral@igalia.com> | 2016-01-04 16:02:47 +0100 |
---|---|---|
committer | Samuel Iglesias Gonsálvez <siglesias@igalia.com> | 2016-04-28 11:58:35 +0200 |
commit | 29541ec53175120f916a0ab74e5d82308aa9ef47 (patch) | |
tree | 270a230dde4cceba602b9f4bacf23cbd6f39f418 /src/compiler/nir/nir_lower_double_ops.c | |
parent | 5fab3d178b7093b0f0e5e98f09052f401ac714ad (diff) | |
download | external_mesa3d-29541ec53175120f916a0ab74e5d82308aa9ef47.zip external_mesa3d-29541ec53175120f916a0ab74e5d82308aa9ef47.tar.gz external_mesa3d-29541ec53175120f916a0ab74e5d82308aa9ef47.tar.bz2 |
nir/lower_double_ops: lower floor()
At least i965 hardware does not have native support for floor on doubles.
v2 (Sam):
- Improve the lowering pass to remove one bcsel (Jason)
Signed-off-by: Samuel Iglesias Gonsálvez <siglesias@igalia.com>
Reviewed-by: Jason Ekstrand <jason@jlekstrand.net>
Diffstat (limited to 'src/compiler/nir/nir_lower_double_ops.c')
-rw-r--r-- | src/compiler/nir/nir_lower_double_ops.c | 25 |
1 files changed, 25 insertions, 0 deletions
diff --git a/src/compiler/nir/nir_lower_double_ops.c b/src/compiler/nir/nir_lower_double_ops.c index e8ae884..1370ddf 100644 --- a/src/compiler/nir/nir_lower_double_ops.c +++ b/src/compiler/nir/nir_lower_double_ops.c @@ -351,6 +351,23 @@ lower_trunc(nir_builder *b, nir_ssa_def *src) nir_iand(b, mask_hi, src_hi)))); } +static nir_ssa_def * +lower_floor(nir_builder *b, nir_ssa_def *src) +{ + /* + * For x >= 0, floor(x) = trunc(x) + * For x < 0, + * - if x is integer, floor(x) = x + * - otherwise, floor(x) = trunc(x) - 1 + */ + nir_ssa_def *tr = nir_ftrunc(b, src); + nir_ssa_def *positive = nir_fge(b, src, nir_imm_double(b, 0.0)); + return nir_bcsel(b, + nir_ior(b, positive, nir_feq(b, src, tr)), + tr, + nir_fsub(b, tr, nir_imm_double(b, 1.0))); +} + static void lower_doubles_instr(nir_alu_instr *instr, nir_lower_doubles_options options) { @@ -379,6 +396,11 @@ lower_doubles_instr(nir_alu_instr *instr, nir_lower_doubles_options options) return; break; + case nir_op_ffloor: + if (!(options & nir_lower_dfloor)) + return; + break; + default: return; } @@ -405,6 +427,9 @@ lower_doubles_instr(nir_alu_instr *instr, nir_lower_doubles_options options) case nir_op_ftrunc: result = lower_trunc(&bld, src); break; + case nir_op_ffloor: + result = lower_floor(&bld, src); + break; default: unreachable("unhandled opcode"); } |