Home | History | Annotate | Download | only in blorp
      1 /*
      2  * Copyright  2012 Intel Corporation
      3  *
      4  * Permission is hereby granted, free of charge, to any person obtaining a
      5  * copy of this software and associated documentation files (the "Software"),
      6  * to deal in the Software without restriction, including without limitation
      7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
      8  * and/or sell copies of the Software, and to permit persons to whom the
      9  * Software is furnished to do so, subject to the following conditions:
     10  *
     11  * The above copyright notice and this permission notice (including the next
     12  * paragraph) shall be included in all copies or substantial portions of the
     13  * Software.
     14  *
     15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
     18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
     19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
     20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
     21  * IN THE SOFTWARE.
     22  */
     23 
     24 #ifndef BLORP_PRIV_H
     25 #define BLORP_PRIV_H
     26 
     27 #include <stdint.h>
     28 
     29 #include "compiler/nir/nir.h"
     30 #include "compiler/brw_compiler.h"
     31 
     32 #include "blorp.h"
     33 
     34 #ifdef __cplusplus
     35 extern "C" {
     36 #endif
     37 
     38 /**
     39  * Binding table indices used by BLORP.
     40  */
     41 enum {
     42    BLORP_RENDERBUFFER_BT_INDEX,
     43    BLORP_TEXTURE_BT_INDEX,
     44    BLORP_NUM_BT_ENTRIES
     45 };
     46 
     47 struct brw_blorp_surface_info
     48 {
     49    bool enabled;
     50 
     51    struct isl_surf surf;
     52    struct blorp_address addr;
     53 
     54    struct isl_surf aux_surf;
     55    struct blorp_address aux_addr;
     56    enum isl_aux_usage aux_usage;
     57 
     58    union isl_color_value clear_color;
     59    struct blorp_address clear_color_addr;
     60 
     61    struct isl_view view;
     62 
     63    /* Z offset into a 3-D texture or slice of a 2-D array texture. */
     64    uint32_t z_offset;
     65 
     66    uint32_t tile_x_sa, tile_y_sa;
     67 };
     68 
     69 void
     70 brw_blorp_surface_info_init(struct blorp_context *blorp,
     71                             struct brw_blorp_surface_info *info,
     72                             const struct blorp_surf *surf,
     73                             unsigned int level, unsigned int layer,
     74                             enum isl_format format, bool is_render_target);
     75 void
     76 blorp_surf_convert_to_single_slice(const struct isl_device *isl_dev,
     77                                    struct brw_blorp_surface_info *info);
     78 void
     79 blorp_surf_convert_to_uncompressed(const struct isl_device *isl_dev,
     80                                    struct brw_blorp_surface_info *info,
     81                                    uint32_t *x, uint32_t *y,
     82                                    uint32_t *width, uint32_t *height);
     83 
     84 
     85 struct brw_blorp_coord_transform
     86 {
     87    float multiplier;
     88    float offset;
     89 };
     90 
     91 /**
     92  * Bounding rectangle telling pixel discard which pixels are not to be
     93  * touched. This is needed in when surfaces are configured as something else
     94  * what they really are:
     95  *
     96  *    - writing W-tiled stencil as Y-tiled
     97  *    - writing interleaved multisampled as single sampled.
     98  *
     99  * See blorp_nir_discard_if_outside_rect().
    100  */
    101 struct brw_blorp_discard_rect
    102 {
    103    uint32_t x0;
    104    uint32_t x1;
    105    uint32_t y0;
    106    uint32_t y1;
    107 };
    108 
    109 /**
    110  * Grid needed for blended and scaled blits of integer formats, see
    111  * blorp_nir_manual_blend_bilinear().
    112  */
    113 struct brw_blorp_rect_grid
    114 {
    115    float x1;
    116    float y1;
    117    float pad[2];
    118 };
    119 
    120 struct blorp_surf_offset {
    121    uint32_t x;
    122    uint32_t y;
    123 };
    124 
    125 struct brw_blorp_wm_inputs
    126 {
    127    uint32_t clear_color[4];
    128 
    129    struct brw_blorp_discard_rect discard_rect;
    130    struct brw_blorp_rect_grid rect_grid;
    131    struct brw_blorp_coord_transform coord_transform[2];
    132 
    133    struct blorp_surf_offset src_offset;
    134    struct blorp_surf_offset dst_offset;
    135 
    136    /* (1/width, 1/height) for the source surface */
    137    float src_inv_size[2];
    138 
    139    /* Minimum layer setting works for all the textures types but texture_3d
    140     * for which the setting has no effect. Use the z-coordinate instead.
    141     */
    142    uint32_t src_z;
    143 
    144    /* Pad out to an integral number of registers */
    145    uint32_t pad[1];
    146 };
    147 
    148 #define BLORP_CREATE_NIR_INPUT(shader, name, type) ({ \
    149    nir_variable *input = nir_variable_create((shader), nir_var_shader_in, \
    150                                              type, #name); \
    151    if ((shader)->info.stage == MESA_SHADER_FRAGMENT) \
    152       input->data.interpolation = INTERP_MODE_FLAT; \
    153    input->data.location = VARYING_SLOT_VAR0 + \
    154       offsetof(struct brw_blorp_wm_inputs, name) / (4 * sizeof(float)); \
    155    input->data.location_frac = \
    156       (offsetof(struct brw_blorp_wm_inputs, name) / sizeof(float)) % 4; \
    157    input; \
    158 })
    159 
    160 struct blorp_vs_inputs {
    161    uint32_t base_layer;
    162    uint32_t _instance_id; /* Set in hardware by SGVS */
    163    uint32_t pad[2];
    164 };
    165 
    166 static inline unsigned
    167 brw_blorp_get_urb_length(const struct brw_wm_prog_data *prog_data)
    168 {
    169    if (prog_data == NULL)
    170       return 1;
    171 
    172    /* From the BSpec: 3D Pipeline - Strips and Fans - 3DSTATE_SBE
    173     *
    174     * read_length = ceiling((max_source_attr+1)/2)
    175     */
    176    return MAX2((prog_data->num_varying_inputs + 1) / 2, 1);
    177 }
    178 
    179 struct blorp_params
    180 {
    181    uint32_t x0;
    182    uint32_t y0;
    183    uint32_t x1;
    184    uint32_t y1;
    185    float z;
    186    uint8_t stencil_mask;
    187    uint8_t stencil_ref;
    188    struct brw_blorp_surface_info depth;
    189    struct brw_blorp_surface_info stencil;
    190    uint32_t depth_format;
    191    struct brw_blorp_surface_info src;
    192    struct brw_blorp_surface_info dst;
    193    enum blorp_hiz_op hiz_op;
    194    bool full_surface_hiz_op;
    195    enum blorp_fast_clear_op fast_clear_op;
    196    bool color_write_disable[4];
    197    struct brw_blorp_wm_inputs wm_inputs;
    198    struct blorp_vs_inputs vs_inputs;
    199    unsigned num_samples;
    200    unsigned num_draw_buffers;
    201    unsigned num_layers;
    202    uint32_t vs_prog_kernel;
    203    struct brw_vs_prog_data *vs_prog_data;
    204    uint32_t sf_prog_kernel;
    205    struct brw_sf_prog_data *sf_prog_data;
    206    uint32_t wm_prog_kernel;
    207    struct brw_wm_prog_data *wm_prog_data;
    208 
    209    bool use_pre_baked_binding_table;
    210    uint32_t pre_baked_binding_table_offset;
    211 };
    212 
    213 void blorp_params_init(struct blorp_params *params);
    214 
    215 enum blorp_shader_type {
    216    BLORP_SHADER_TYPE_BLIT,
    217    BLORP_SHADER_TYPE_CLEAR,
    218    BLORP_SHADER_TYPE_MCS_PARTIAL_RESOLVE,
    219    BLORP_SHADER_TYPE_LAYER_OFFSET_VS,
    220    BLORP_SHADER_TYPE_GEN4_SF,
    221 };
    222 
    223 struct brw_blorp_blit_prog_key
    224 {
    225    enum blorp_shader_type shader_type; /* Must be BLORP_SHADER_TYPE_BLIT */
    226 
    227    /* Number of samples per pixel that have been configured in the surface
    228     * state for texturing from.
    229     */
    230    unsigned tex_samples;
    231 
    232    /* MSAA layout that has been configured in the surface state for texturing
    233     * from.
    234     */
    235    enum isl_msaa_layout tex_layout;
    236 
    237    enum isl_aux_usage tex_aux_usage;
    238 
    239    /* Actual number of samples per pixel in the source image. */
    240    unsigned src_samples;
    241 
    242    /* Actual MSAA layout used by the source image. */
    243    enum isl_msaa_layout src_layout;
    244 
    245    /* Number of bits per channel in the source image. */
    246    uint8_t src_bpc;
    247 
    248    /* True if the source requires normalized coordinates */
    249    bool src_coords_normalized;
    250 
    251    /* Number of samples per pixel that have been configured in the render
    252     * target.
    253     */
    254    unsigned rt_samples;
    255 
    256    /* MSAA layout that has been configured in the render target. */
    257    enum isl_msaa_layout rt_layout;
    258 
    259    /* Actual number of samples per pixel in the destination image. */
    260    unsigned dst_samples;
    261 
    262    /* Actual MSAA layout used by the destination image. */
    263    enum isl_msaa_layout dst_layout;
    264 
    265    /* Number of bits per channel in the destination image. */
    266    uint8_t dst_bpc;
    267 
    268    /* Type of the data to be read from the texture (one of
    269     * nir_type_(int|uint|float)).
    270     */
    271    nir_alu_type texture_data_type;
    272 
    273    /* True if the source image is W tiled.  If true, the surface state for the
    274     * source image must be configured as Y tiled, and tex_samples must be 0.
    275     */
    276    bool src_tiled_w;
    277 
    278    /* True if the destination image is W tiled.  If true, the surface state
    279     * for the render target must be configured as Y tiled, and rt_samples must
    280     * be 0.
    281     */
    282    bool dst_tiled_w;
    283 
    284    /* True if the destination is an RGB format.  If true, the surface state
    285     * for the render target must be configured as red with three times the
    286     * normal width.  We need to do this because you cannot render to
    287     * non-power-of-two formats.
    288     */
    289    bool dst_rgb;
    290 
    291    /* True if all source samples should be blended together to produce each
    292     * destination pixel.  If true, src_tiled_w must be false, tex_samples must
    293     * equal src_samples, and tex_samples must be nonzero.
    294     */
    295    bool blend;
    296 
    297    /* True if the rectangle being sent through the rendering pipeline might be
    298     * larger than the destination rectangle, so the WM program should kill any
    299     * pixels that are outside the destination rectangle.
    300     */
    301    bool use_kill;
    302 
    303    /**
    304     * True if the WM program should be run in MSDISPMODE_PERSAMPLE with more
    305     * than one sample per pixel.
    306     */
    307    bool persample_msaa_dispatch;
    308 
    309    /* True for scaled blitting. */
    310    bool blit_scaled;
    311 
    312    /* True if this blit operation may involve intratile offsets on the source.
    313     * In this case, we need to add the offset before texturing.
    314     */
    315    bool need_src_offset;
    316 
    317    /* True if this blit operation may involve intratile offsets on the
    318     * destination.  In this case, we need to add the offset to gl_FragCoord.
    319     */
    320    bool need_dst_offset;
    321 
    322    /* Scale factors between the pixel grid and the grid of samples. We're
    323     * using grid of samples for bilinear filetring in multisample scaled blits.
    324     */
    325    float x_scale;
    326    float y_scale;
    327 
    328    /* True for blits with filter = GL_LINEAR. */
    329    bool bilinear_filter;
    330 };
    331 
    332 /**
    333  * \name BLORP internals
    334  * \{
    335  *
    336  * Used internally by gen6_blorp_exec() and gen7_blorp_exec().
    337  */
    338 
    339 void brw_blorp_init_wm_prog_key(struct brw_wm_prog_key *wm_key);
    340 
    341 const unsigned *
    342 blorp_compile_fs(struct blorp_context *blorp, void *mem_ctx,
    343                  struct nir_shader *nir,
    344                  struct brw_wm_prog_key *wm_key,
    345                  bool use_repclear,
    346                  struct brw_wm_prog_data *wm_prog_data);
    347 
    348 const unsigned *
    349 blorp_compile_vs(struct blorp_context *blorp, void *mem_ctx,
    350                  struct nir_shader *nir,
    351                  struct brw_vs_prog_data *vs_prog_data);
    352 
    353 bool
    354 blorp_ensure_sf_program(struct blorp_context *blorp,
    355                         struct blorp_params *params);
    356 
    357 /** \} */
    358 
    359 #ifdef __cplusplus
    360 } /* end extern "C" */
    361 #endif /* __cplusplus */
    362 
    363 #endif /* BLORP_PRIV_H */
    364