Home | History | Annotate | Download | only in i915
      1 /**************************************************************************
      2  *
      3  * Copyright 2003 VMware, Inc.
      4  * All Rights Reserved.
      5  *
      6  * Permission is hereby granted, free of charge, to any person obtaining a
      7  * copy of this software and associated documentation files (the
      8  * "Software"), to deal in the Software without restriction, including
      9  * without limitation the rights to use, copy, modify, merge, publish,
     10  * distribute, sub license, and/or sell copies of the Software, and to
     11  * permit persons to whom the Software is furnished to do so, subject to
     12  * the following conditions:
     13  *
     14  * The above copyright notice and this permission notice (including the
     15  * next paragraph) shall be included in all copies or substantial portions
     16  * of the Software.
     17  *
     18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
     19  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
     20  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
     21  * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
     22  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
     23  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
     24  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
     25  *
     26  **************************************************************************/
     27 
     28 
     29 #ifndef I915_FPC_H
     30 #define I915_FPC_H
     31 
     32 
     33 #include "i915_context.h"
     34 #include "i915_reg.h"
     35 
     36 #include "pipe/p_shader_tokens.h"
     37 
     38 #include "tgsi/tgsi_parse.h"
     39 
     40 #define I915_PROGRAM_SIZE 192
     41 
     42 /* Use those indices for pos/face routing, must be >= num of inputs */
     43 #define I915_SEMANTIC_POS  100
     44 #define I915_SEMANTIC_FACE 101
     45 
     46 
     47 /**
     48  * Program translation state
     49  */
     50 struct i915_fp_compile {
     51    struct i915_fragment_shader *shader;  /* the shader we're compiling */
     52 
     53    boolean used_constants[I915_MAX_CONSTANT];
     54 
     55    /** maps TGSI immediate index to constant slot */
     56    uint num_immediates;
     57    uint immediates_map[I915_MAX_CONSTANT];
     58    float immediates[I915_MAX_CONSTANT][4];
     59 
     60    boolean first_instruction;
     61 
     62    uint declarations[I915_PROGRAM_SIZE];
     63    uint program[I915_PROGRAM_SIZE];
     64 
     65    uint *csr;            /**< Cursor, points into program. */
     66 
     67    uint *decl;           /**< Cursor, points into declarations. */
     68 
     69    uint decl_s;          /**< flags for which s regs need to be decl'd */
     70    uint decl_t;          /**< flags for which t regs need to be decl'd */
     71 
     72    uint temp_flag;       /**< Tracks temporary regs which are in use */
     73    uint utemp_flag;      /**< Tracks TYPE_U temporary regs which are in use */
     74 
     75    uint register_phases[I915_MAX_TEMPORARY];
     76    uint nr_tex_indirect;
     77    uint nr_tex_insn;
     78    uint nr_alu_insn;
     79    uint nr_decl_insn;
     80 
     81    boolean error;      /**< Set if i915_program_error() is called */
     82    uint NumNativeInstructions;
     83    uint NumNativeAluInstructions;
     84    uint NumNativeTexInstructions;
     85    uint NumNativeTexIndirections;
     86 };
     87 
     88 
     89 /* Having zero and one in here makes the definition of swizzle a lot
     90  * easier.
     91  */
     92 #define UREG_TYPE_SHIFT               29
     93 #define UREG_NR_SHIFT                 24
     94 #define UREG_CHANNEL_X_NEGATE_SHIFT   23
     95 #define UREG_CHANNEL_X_SHIFT          20
     96 #define UREG_CHANNEL_Y_NEGATE_SHIFT   19
     97 #define UREG_CHANNEL_Y_SHIFT          16
     98 #define UREG_CHANNEL_Z_NEGATE_SHIFT   15
     99 #define UREG_CHANNEL_Z_SHIFT          12
    100 #define UREG_CHANNEL_W_NEGATE_SHIFT   11
    101 #define UREG_CHANNEL_W_SHIFT          8
    102 #define UREG_CHANNEL_ZERO_NEGATE_MBZ  5
    103 #define UREG_CHANNEL_ZERO_SHIFT       4
    104 #define UREG_CHANNEL_ONE_NEGATE_MBZ   1
    105 #define UREG_CHANNEL_ONE_SHIFT        0
    106 
    107 #define UREG_BAD          0xffffffff    /* not a valid ureg */
    108 
    109 #define X    SRC_X
    110 #define Y    SRC_Y
    111 #define Z    SRC_Z
    112 #define W    SRC_W
    113 #define ZERO SRC_ZERO
    114 #define ONE  SRC_ONE
    115 
    116 /* Construct a ureg:
    117  */
    118 #define UREG( type, nr ) (((type)<< UREG_TYPE_SHIFT) |		\
    119 			  ((nr)  << UREG_NR_SHIFT) |		\
    120 			  (X     << UREG_CHANNEL_X_SHIFT) |	\
    121 			  (Y     << UREG_CHANNEL_Y_SHIFT) |	\
    122 			  (Z     << UREG_CHANNEL_Z_SHIFT) |	\
    123 			  (W     << UREG_CHANNEL_W_SHIFT) |	\
    124 			  (ZERO  << UREG_CHANNEL_ZERO_SHIFT) |	\
    125 			  (ONE   << UREG_CHANNEL_ONE_SHIFT))
    126 
    127 #define GET_CHANNEL_SRC( reg, channel ) ((reg<<(channel*4)) & (0xf<<20))
    128 #define CHANNEL_SRC( src, channel ) (src>>(channel*4))
    129 
    130 #define GET_UREG_TYPE(reg) (((reg)>>UREG_TYPE_SHIFT)&REG_TYPE_MASK)
    131 #define GET_UREG_NR(reg)   (((reg)>>UREG_NR_SHIFT)&REG_NR_MASK)
    132 
    133 
    134 
    135 #define UREG_XYZW_CHANNEL_MASK 0x00ffff00
    136 
    137 /* One neat thing about the UREG representation:
    138  */
    139 static inline int
    140 swizzle(int reg, uint x, uint y, uint z, uint w)
    141 {
    142    assert(x <= SRC_ONE);
    143    assert(y <= SRC_ONE);
    144    assert(z <= SRC_ONE);
    145    assert(w <= SRC_ONE);
    146    return ((reg & ~UREG_XYZW_CHANNEL_MASK) |
    147            CHANNEL_SRC(GET_CHANNEL_SRC(reg, x), 0) |
    148            CHANNEL_SRC(GET_CHANNEL_SRC(reg, y), 1) |
    149            CHANNEL_SRC(GET_CHANNEL_SRC(reg, z), 2) |
    150            CHANNEL_SRC(GET_CHANNEL_SRC(reg, w), 3));
    151 }
    152 
    153 
    154 #define A0_DEST( reg ) (((reg)&UREG_TYPE_NR_MASK)>>UREG_A0_DEST_SHIFT_LEFT)
    155 #define D0_DEST( reg ) (((reg)&UREG_TYPE_NR_MASK)>>UREG_A0_DEST_SHIFT_LEFT)
    156 #define T0_DEST( reg ) (((reg)&UREG_TYPE_NR_MASK)>>UREG_A0_DEST_SHIFT_LEFT)
    157 #define A0_SRC0( reg ) (((reg)&UREG_MASK)>>UREG_A0_SRC0_SHIFT_LEFT)
    158 #define A1_SRC0( reg ) (((reg)&UREG_MASK)<<UREG_A1_SRC0_SHIFT_RIGHT)
    159 #define A1_SRC1( reg ) (((reg)&UREG_MASK)>>UREG_A1_SRC1_SHIFT_LEFT)
    160 #define A2_SRC1( reg ) (((reg)&UREG_MASK)<<UREG_A2_SRC1_SHIFT_RIGHT)
    161 #define A2_SRC2( reg ) (((reg)&UREG_MASK)>>UREG_A2_SRC2_SHIFT_LEFT)
    162 
    163 /* These are special, and don't have swizzle/negate bits.
    164  */
    165 #define T0_SAMPLER( reg )     (GET_UREG_NR(reg)<<T0_SAMPLER_NR_SHIFT)
    166 #define T1_ADDRESS_REG( reg ) ((GET_UREG_NR(reg)<<T1_ADDRESS_REG_NR_SHIFT) | \
    167 			       (GET_UREG_TYPE(reg)<<T1_ADDRESS_REG_TYPE_SHIFT))
    168 
    169 
    170 /* Macros for translating UREG's into the various register fields used
    171  * by the I915 programmable unit.
    172  */
    173 #define UREG_A0_DEST_SHIFT_LEFT  (UREG_TYPE_SHIFT - A0_DEST_TYPE_SHIFT)
    174 #define UREG_A0_SRC0_SHIFT_LEFT  (UREG_TYPE_SHIFT - A0_SRC0_TYPE_SHIFT)
    175 #define UREG_A1_SRC0_SHIFT_RIGHT (A1_SRC0_CHANNEL_W_SHIFT - UREG_CHANNEL_W_SHIFT)
    176 #define UREG_A1_SRC1_SHIFT_LEFT  (UREG_TYPE_SHIFT - A1_SRC1_TYPE_SHIFT)
    177 #define UREG_A2_SRC1_SHIFT_RIGHT (A2_SRC1_CHANNEL_W_SHIFT - UREG_CHANNEL_W_SHIFT)
    178 #define UREG_A2_SRC2_SHIFT_LEFT  (UREG_TYPE_SHIFT - A2_SRC2_TYPE_SHIFT)
    179 
    180 #define UREG_MASK         0xffffff00
    181 #define UREG_TYPE_NR_MASK ((REG_TYPE_MASK << UREG_TYPE_SHIFT) | \
    182   			   (REG_NR_MASK << UREG_NR_SHIFT))
    183 
    184 
    185 
    186 
    187 /***********************************************************************
    188  * Public interface for the compiler
    189  */
    190 extern void
    191 i915_translate_fragment_program( struct i915_context *i915,
    192                                  struct i915_fragment_shader *fs);
    193 
    194 
    195 
    196 extern uint i915_get_temp(struct i915_fp_compile *p);
    197 extern uint i915_get_utemp(struct i915_fp_compile *p);
    198 extern void i915_release_utemps(struct i915_fp_compile *p);
    199 
    200 
    201 extern uint i915_emit_texld(struct i915_fp_compile *p,
    202                               uint dest,
    203                               uint destmask,
    204                               uint sampler,
    205                               uint coord,
    206                               uint op,
    207                               uint num_coord);
    208 
    209 extern uint i915_emit_arith(struct i915_fp_compile *p,
    210                               uint op,
    211                               uint dest,
    212                               uint mask,
    213                               uint saturate,
    214                               uint src0, uint src1, uint src2);
    215 
    216 extern uint i915_emit_decl(struct i915_fp_compile *p,
    217                              uint type, uint nr, uint d0_flags);
    218 
    219 
    220 extern uint i915_emit_const1f(struct i915_fp_compile *p, float c0);
    221 
    222 extern uint i915_emit_const2f(struct i915_fp_compile *p,
    223                                 float c0, float c1);
    224 
    225 extern uint i915_emit_const4fv(struct i915_fp_compile *p,
    226                                  const float * c);
    227 
    228 extern uint i915_emit_const4f(struct i915_fp_compile *p,
    229                                 float c0, float c1,
    230                                 float c2, float c3);
    231 
    232 
    233 /*======================================================================
    234  * i915_fpc_translate.c
    235  */
    236 
    237 extern void
    238 i915_program_error(struct i915_fp_compile *p, const char *msg, ...);
    239 
    240 
    241 /*======================================================================
    242  * i915_fpc_optimize.c
    243  */
    244 
    245 
    246 struct i915_src_register
    247 {
    248    unsigned File        : 4;  /* TGSI_FILE_ */
    249    unsigned Indirect    : 1;  /* BOOL */
    250    unsigned Dimension   : 1;  /* BOOL */
    251    int      Index       : 16; /* SINT */
    252    unsigned SwizzleX    : 3;  /* TGSI_SWIZZLE_ */
    253    unsigned SwizzleY    : 3;  /* TGSI_SWIZZLE_ */
    254    unsigned SwizzleZ    : 3;  /* TGSI_SWIZZLE_ */
    255    unsigned SwizzleW    : 3;  /* TGSI_SWIZZLE_ */
    256    unsigned Absolute    : 1;    /* BOOL */
    257    unsigned Negate      : 1;    /* BOOL */
    258 };
    259 
    260 /* Additional swizzle supported in i915 */
    261 #define TGSI_SWIZZLE_ZERO 4
    262 #define TGSI_SWIZZLE_ONE 5
    263 
    264 struct i915_dst_register
    265 {
    266    unsigned File        : 4;  /* TGSI_FILE_ */
    267    unsigned WriteMask   : 4;  /* TGSI_WRITEMASK_ */
    268    unsigned Indirect    : 1;  /* BOOL */
    269    unsigned Dimension   : 1;  /* BOOL */
    270    int      Index       : 16; /* SINT */
    271    unsigned Padding     : 6;
    272 };
    273 
    274 
    275 struct i915_full_dst_register
    276 {
    277    struct i915_dst_register               Register;
    278 /*
    279    struct tgsi_ind_register               Indirect;
    280    struct tgsi_dimension                  Dimension;
    281    struct tgsi_ind_register               DimIndirect;
    282 */
    283 };
    284 
    285 struct i915_full_src_register
    286 {
    287    struct i915_src_register         Register;
    288 /*
    289    struct tgsi_ind_register         Indirect;
    290    struct tgsi_dimension            Dimension;
    291    struct tgsi_ind_register         DimIndirect;
    292 */
    293 };
    294 
    295 struct i915_full_instruction
    296 {
    297    struct tgsi_instruction             Instruction;
    298 /*
    299    struct tgsi_instruction_predicate   Predicate;
    300    struct tgsi_instruction_label       Label;
    301 */
    302    struct tgsi_instruction_texture     Texture;
    303    struct i915_full_dst_register       Dst[1];
    304    struct i915_full_src_register       Src[3];
    305 };
    306 
    307 
    308 union i915_full_token
    309 {
    310    struct tgsi_token             Token;
    311    struct tgsi_full_declaration  FullDeclaration;
    312    struct tgsi_full_immediate    FullImmediate;
    313    struct i915_full_instruction  FullInstruction;
    314    struct tgsi_full_property     FullProperty;
    315 };
    316 
    317 struct i915_token_list
    318 {
    319    union i915_full_token*     Tokens;
    320    unsigned                   NumTokens;
    321 };
    322 
    323 extern struct i915_token_list* i915_optimize(const struct tgsi_token *tokens);
    324 
    325 extern void i915_optimize_free(struct i915_token_list *tokens);
    326 
    327 extern uint i915_num_coords(uint tex);
    328 
    329 #endif
    330