/************************************************************************** * * Copyright 2007 VMware, Inc. * All Rights Reserved. * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the * "Software"), to deal in the Software without restriction, including * without limitation the rights to use, copy, modify, merge, publish, * distribute, sub license, and/or sell copies of the Software, and to * permit persons to whom the Software is furnished to do so, subject to * the following conditions: * * The above copyright notice and this permission notice (including the * next paragraph) shall be included in all copies or substantial portions * of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. * **************************************************************************/ #include "util/u_debug.h" #include "pipe/p_shader_tokens.h" #include "tgsi_parse.h" #include "tgsi_util.h" #include "tgsi_exec.h" union pointer_hack { void *pointer; uint64_t uint64; }; void * tgsi_align_128bit( void *unaligned ) { union pointer_hack ph; ph.uint64 = 0; ph.pointer = unaligned; ph.uint64 = (ph.uint64 + 15) & ~15; return ph.pointer; } unsigned tgsi_util_get_src_register_swizzle( const struct tgsi_src_register *reg, unsigned component ) { switch (component) { case TGSI_CHAN_X: return reg->SwizzleX; case TGSI_CHAN_Y: return reg->SwizzleY; case TGSI_CHAN_Z: return reg->SwizzleZ; case TGSI_CHAN_W: return reg->SwizzleW; default: assert(0); } return 0; } unsigned tgsi_util_get_full_src_register_swizzle( const struct tgsi_full_src_register *reg, unsigned component ) { return tgsi_util_get_src_register_swizzle( ®->Register, component ); } void tgsi_util_set_src_register_swizzle( struct tgsi_src_register *reg, unsigned swizzle, unsigned component ) { switch( component ) { case 0: reg->SwizzleX = swizzle; break; case 1: reg->SwizzleY = swizzle; break; case 2: reg->SwizzleZ = swizzle; break; case 3: reg->SwizzleW = swizzle; break; default: assert( 0 ); } } unsigned tgsi_util_get_full_src_register_sign_mode( const struct tgsi_full_src_register *reg, unsigned component ) { unsigned sign_mode; if( reg->Register.Absolute ) { /* Consider only the post-abs negation. */ if( reg->Register.Negate ) { sign_mode = TGSI_UTIL_SIGN_SET; } else { sign_mode = TGSI_UTIL_SIGN_CLEAR; } } else { if( reg->Register.Negate ) { sign_mode = TGSI_UTIL_SIGN_TOGGLE; } else { sign_mode = TGSI_UTIL_SIGN_KEEP; } } return sign_mode; } void tgsi_util_set_full_src_register_sign_mode( struct tgsi_full_src_register *reg, unsigned sign_mode ) { switch (sign_mode) { case TGSI_UTIL_SIGN_CLEAR: reg->Register.Negate = 0; reg->Register.Absolute = 1; break; case TGSI_UTIL_SIGN_SET: reg->Register.Absolute = 1; reg->Register.Negate = 1; break; case TGSI_UTIL_SIGN_TOGGLE: reg->Register.Negate = 1; reg->Register.Absolute = 0; break; case TGSI_UTIL_SIGN_KEEP: reg->Register.Negate = 0; reg->Register.Absolute = 0; break; default: assert( 0 ); } } /** * Determine which channels of the specificed src register are effectively * used by this instruction. */ unsigned tgsi_util_get_inst_usage_mask(const struct tgsi_full_instruction *inst, unsigned src_idx) { const struct tgsi_full_src_register *src = &inst->Src[src_idx]; unsigned write_mask = inst->Dst[0].Register.WriteMask; unsigned read_mask; unsigned usage_mask; unsigned chan; switch (inst->Instruction.Opcode) { case TGSI_OPCODE_MOV: case TGSI_OPCODE_ARL: case TGSI_OPCODE_ARR: case TGSI_OPCODE_RCP: case TGSI_OPCODE_MUL: case TGSI_OPCODE_DIV: case TGSI_OPCODE_ADD: case TGSI_OPCODE_MIN: case TGSI_OPCODE_MAX: case TGSI_OPCODE_SLT: case TGSI_OPCODE_SGE: case TGSI_OPCODE_MAD: case TGSI_OPCODE_SUB: case TGSI_OPCODE_LRP: case TGSI_OPCODE_FMA: case TGSI_OPCODE_FRC: case TGSI_OPCODE_CEIL: case TGSI_OPCODE_CLAMP: case TGSI_OPCODE_FLR: case TGSI_OPCODE_ROUND: case TGSI_OPCODE_POW: case TGSI_OPCODE_ABS: case TGSI_OPCODE_COS: case TGSI_OPCODE_SIN: case TGSI_OPCODE_DDX: case TGSI_OPCODE_DDY: case TGSI_OPCODE_SEQ: case TGSI_OPCODE_SGT: case TGSI_OPCODE_SLE: case TGSI_OPCODE_SNE: case TGSI_OPCODE_SSG: case TGSI_OPCODE_CMP: case TGSI_OPCODE_TRUNC: case TGSI_OPCODE_NOT: case TGSI_OPCODE_AND: case TGSI_OPCODE_OR: case TGSI_OPCODE_XOR: case TGSI_OPCODE_SAD: case TGSI_OPCODE_FSEQ: case TGSI_OPCODE_FSGE: case TGSI_OPCODE_FSLT: case TGSI_OPCODE_FSNE: case TGSI_OPCODE_F2I: case TGSI_OPCODE_IDIV: case TGSI_OPCODE_IMAX: case TGSI_OPCODE_IMIN: case TGSI_OPCODE_INEG: case TGSI_OPCODE_ISGE: case TGSI_OPCODE_ISHR: case TGSI_OPCODE_ISLT: case TGSI_OPCODE_F2U: case TGSI_OPCODE_U2F: case TGSI_OPCODE_UADD: case TGSI_OPCODE_UDIV: case TGSI_OPCODE_UMAD: case TGSI_OPCODE_UMAX: case TGSI_OPCODE_UMIN: case TGSI_OPCODE_UMOD: case TGSI_OPCODE_UMUL: case TGSI_OPCODE_USEQ: case TGSI_OPCODE_USGE: case TGSI_OPCODE_USHR: case TGSI_OPCODE_USLT: case TGSI_OPCODE_USNE: case TGSI_OPCODE_IMUL_HI: case TGSI_OPCODE_UMUL_HI: case TGSI_OPCODE_DDX_FINE: case TGSI_OPCODE_DDY_FINE: /* Channel-wise operations */ read_mask = write_mask; break; case TGSI_OPCODE_EX2: case TGSI_OPCODE_LG2: read_mask = TGSI_WRITEMASK_X; break; case TGSI_OPCODE_SCS: read_mask = write_mask & TGSI_WRITEMASK_XY ? TGSI_WRITEMASK_X : 0; break; case TGSI_OPCODE_EXP: case TGSI_OPCODE_LOG: read_mask = write_mask & TGSI_WRITEMASK_XYZ ? TGSI_WRITEMASK_X : 0; break; case TGSI_OPCODE_DP2A: read_mask = src_idx == 2 ? TGSI_WRITEMASK_X : TGSI_WRITEMASK_XY; break; case TGSI_OPCODE_DP2: read_mask = TGSI_WRITEMASK_XY; break; case TGSI_OPCODE_DP3: read_mask = TGSI_WRITEMASK_XYZ; break; case TGSI_OPCODE_DP4: read_mask = TGSI_WRITEMASK_XYZW; break; case TGSI_OPCODE_DPH: read_mask = src_idx == 0 ? TGSI_WRITEMASK_XYZ : TGSI_WRITEMASK_XYZW; break; case TGSI_OPCODE_TEX: case TGSI_OPCODE_TXD: case TGSI_OPCODE_TXB: case TGSI_OPCODE_TXL: case TGSI_OPCODE_TXP: if (src_idx == 0) { /* Note that the SHADOW variants use the Z component too */ switch (inst->Texture.Texture) { case TGSI_TEXTURE_1D: read_mask = TGSI_WRITEMASK_X; break; case TGSI_TEXTURE_SHADOW1D: read_mask = TGSI_WRITEMASK_XZ; break; case TGSI_TEXTURE_1D_ARRAY: case TGSI_TEXTURE_2D: case TGSI_TEXTURE_RECT: read_mask = TGSI_WRITEMASK_XY; break; case TGSI_TEXTURE_SHADOW1D_ARRAY: case TGSI_TEXTURE_SHADOW2D: case TGSI_TEXTURE_SHADOWRECT: case TGSI_TEXTURE_2D_ARRAY: case TGSI_TEXTURE_3D: case TGSI_TEXTURE_CUBE: case TGSI_TEXTURE_2D_MSAA: read_mask = TGSI_WRITEMASK_XYZ; break; case TGSI_TEXTURE_SHADOW2D_ARRAY: case TGSI_TEXTURE_CUBE_ARRAY: case TGSI_TEXTURE_SHADOWCUBE: case TGSI_TEXTURE_2D_ARRAY_MSAA: case TGSI_TEXTURE_SHADOWCUBE_ARRAY: read_mask = TGSI_WRITEMASK_XYZW; break; default: assert(0); read_mask = 0; } if (inst->Instruction.Opcode != TGSI_OPCODE_TEX) { read_mask |= TGSI_WRITEMASK_W; } } else { /* A safe approximation */ read_mask = TGSI_WRITEMASK_XYZW; } break; default: /* Assume all channels are read */ read_mask = TGSI_WRITEMASK_XYZW; break; } usage_mask = 0; for (chan = 0; chan < 4; ++chan) { if (read_mask & (1 << chan)) { usage_mask |= 1 << tgsi_util_get_full_src_register_swizzle(src, chan); } } return usage_mask; } /** * Convert a tgsi_ind_register into a tgsi_src_register */ struct tgsi_src_register tgsi_util_get_src_from_ind(const struct tgsi_ind_register *reg) { struct tgsi_src_register src = { 0 }; src.File = reg->File; src.Index = reg->Index; src.SwizzleX = reg->Swizzle; src.SwizzleY = reg->Swizzle; src.SwizzleZ = reg->Swizzle; src.SwizzleW = reg->Swizzle; return src; } /** * Return the dimension of the texture coordinates (layer included for array * textures), as well as the location of the shadow reference value or the * sample index. */ int tgsi_util_get_texture_coord_dim(unsigned tgsi_tex) { /* * Depending on the texture target, (src0.xyzw, src1.x) is interpreted * differently: * * (s, X, X, X, X), for BUFFER * (s, X, X, X, X), for 1D * (s, t, X, X, X), for 2D, RECT * (s, t, r, X, X), for 3D, CUBE * * (s, layer, X, X, X), for 1D_ARRAY * (s, t, layer, X, X), for 2D_ARRAY * (s, t, r, layer, X), for CUBE_ARRAY * * (s, X, shadow, X, X), for SHADOW1D * (s, t, shadow, X, X), for SHADOW2D, SHADOWRECT * (s, t, r, shadow, X), for SHADOWCUBE * * (s, layer, shadow, X, X), for SHADOW1D_ARRAY * (s, t, layer, shadow, X), for SHADOW2D_ARRAY * (s, t, r, layer, shadow), for SHADOWCUBE_ARRAY * * (s, t, sample, X, X), for 2D_MSAA * (s, t, layer, sample, X), for 2D_ARRAY_MSAA */ switch (tgsi_tex) { case TGSI_TEXTURE_BUFFER: case TGSI_TEXTURE_1D: case TGSI_TEXTURE_SHADOW1D: return 1; case TGSI_TEXTURE_2D: case TGSI_TEXTURE_RECT: case TGSI_TEXTURE_1D_ARRAY: case TGSI_TEXTURE_SHADOW2D: case TGSI_TEXTURE_SHADOWRECT: case TGSI_TEXTURE_SHADOW1D_ARRAY: case TGSI_TEXTURE_2D_MSAA: return 2; case TGSI_TEXTURE_3D: case TGSI_TEXTURE_CUBE: case TGSI_TEXTURE_2D_ARRAY: case TGSI_TEXTURE_SHADOWCUBE: case TGSI_TEXTURE_SHADOW2D_ARRAY: case TGSI_TEXTURE_2D_ARRAY_MSAA: return 3; case TGSI_TEXTURE_CUBE_ARRAY: case TGSI_TEXTURE_SHADOWCUBE_ARRAY: return 4; default: assert(!"unknown texture target"); return 0; } } /** * Given a TGSI_TEXTURE_x target, return the src register index for the * shadow reference coordinate. */ int tgsi_util_get_shadow_ref_src_index(unsigned tgsi_tex) { switch (tgsi_tex) { case TGSI_TEXTURE_SHADOW1D: case TGSI_TEXTURE_SHADOW2D: case TGSI_TEXTURE_SHADOWRECT: case TGSI_TEXTURE_SHADOW1D_ARRAY: return 2; case TGSI_TEXTURE_SHADOWCUBE: case TGSI_TEXTURE_SHADOW2D_ARRAY: case TGSI_TEXTURE_2D_MSAA: case TGSI_TEXTURE_2D_ARRAY_MSAA: return 3; case TGSI_TEXTURE_SHADOWCUBE_ARRAY: return 4; default: /* no shadow nor sample */ return -1; } } boolean tgsi_is_shadow_target(unsigned target) { switch (target) { case TGSI_TEXTURE_SHADOW1D: case TGSI_TEXTURE_SHADOW2D: case TGSI_TEXTURE_SHADOWRECT: case TGSI_TEXTURE_SHADOW1D_ARRAY: case TGSI_TEXTURE_SHADOW2D_ARRAY: case TGSI_TEXTURE_SHADOWCUBE: case TGSI_TEXTURE_SHADOWCUBE_ARRAY: return TRUE; default: return FALSE; } }