Home | History | Annotate | Download | only in nv30
      1 /*
      2  * Copyright 2012 Red Hat Inc.
      3  *
      4  * Permission is hereby granted, free of charge, to any person obtaining a
      5  * copy of this software and associated documentation files (the "Software"),
      6  * to deal in the Software without restriction, including without limitation
      7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
      8  * and/or sell copies of the Software, and to permit persons to whom the
      9  * Software is furnished to do so, subject to the following conditions:
     10  *
     11  * The above copyright notice and this permission notice shall be included in
     12  * all copies or substantial portions of the Software.
     13  *
     14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
     17  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
     18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
     19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
     20  * OTHER DEALINGS IN THE SOFTWARE.
     21  *
     22  * Authors: Ben Skeggs
     23  *
     24  */
     25 
     26 #include "draw/draw_context.h"
     27 #include "util/u_dynarray.h"
     28 #include "tgsi/tgsi_parse.h"
     29 
     30 #include "nv_object.xml.h"
     31 #include "nv30/nv30-40_3d.xml.h"
     32 #include "nv30/nv30_context.h"
     33 #include "nv30/nvfx_shader.h"
     34 #include "nv30/nv30_state.h"
     35 
     36 static void
     37 nv30_vertprog_destroy(struct nv30_vertprog *vp)
     38 {
     39    util_dynarray_fini(&vp->branch_relocs);
     40    nouveau_heap_free(&vp->exec);
     41    FREE(vp->insns);
     42    vp->insns = NULL;
     43    vp->nr_insns = 0;
     44 
     45    util_dynarray_fini(&vp->const_relocs);
     46    nouveau_heap_free(&vp->data);
     47    FREE(vp->consts);
     48    vp->consts = NULL;
     49    vp->nr_consts = 0;
     50 
     51    vp->translated = false;
     52 }
     53 
/*
 * Bring the hardware vertex program state in line with the vertex program
 * currently bound in nv30->vertprog.program.
 *
 * Steps, in order:
 *  - drop the existing translation when the fragment program's texcoord
 *    table or the rasterizer's clip_plane_enable mask differs from the copy
 *    cached in the vertex program;
 *  - translate the program with _nvfx_vertprog_translate() if it is not
 *    currently translated;
 *  - allocate room in the screen's vp_exec_heap / vp_data_heap (evicting
 *    other allocations if the first attempt fails) and patch the branch and
 *    constant relocations with the allocated start offsets;
 *  - push constant uploads, the instruction upload and the start/enable
 *    methods.
 *
 * If translation or either heap allocation fails, NV30_NEW_VERTPROG is set
 * in nv30->draw_flags and the function returns before pushing any commands.
 *
 * NOTE(review): vp is dereferenced unconditionally and fp whenever
 * NV30_NEW_FRAGPROG is dirty (and on the NV40+ path at the end) -- this
 * assumes the caller only validates with both programs bound; confirm.
 */
void
nv30_vertprog_validate(struct nv30_context *nv30)
{
   struct nouveau_pushbuf *push = nv30->base.pushbuf;
   struct nouveau_object *eng3d = nv30->screen->eng3d;
   struct nv30_vertprog *vp = nv30->vertprog.program;
   struct nv30_fragprog *fp = nv30->fragprog.program;
   bool upload_code = false;
   bool upload_data = false;
   unsigned i;

   /* A changed fragment program may use a different texcoord table; if it
    * no longer matches the cached copy, the translation is discarded and the
    * new table is cached for the next translation.
    */
   if (nv30->dirty & NV30_NEW_FRAGPROG) {
      if (memcmp(vp->texcoord, fp->texcoord, sizeof(vp->texcoord))) {
         if (vp->translated)
            nv30_vertprog_destroy(vp);
         memcpy(vp->texcoord, fp->texcoord, sizeof(vp->texcoord));
      }
   }

   /* Likewise, a change in the enabled user clip planes invalidates the
    * existing translation.
    */
   if (nv30->rast && nv30->rast->pipe.clip_plane_enable != vp->enabled_ucps) {
      vp->enabled_ucps = nv30->rast->pipe.clip_plane_enable;
      if (vp->translated)
         nv30_vertprog_destroy(vp);
   }

   if (!vp->translated) {
      vp->translated = _nvfx_vertprog_translate(eng3d->oclass, vp);
      if (!vp->translated) {
         /* Translation failed: flag the program in draw_flags and bail. */
         nv30->draw_flags |= NV30_NEW_VERTPROG;
         return;
      }
      nv30->dirty |= NV30_NEW_VERTPROG;
   }

   /* No exec heap allocation yet: reserve nr_insns slots and fix up branch
    * targets, which depend on where the program lands.
    */
   if (!vp->exec) {
      struct nouveau_heap *heap = nv30->screen->vp_exec_heap;
      struct nv30_shader_reloc *reloc = vp->branch_relocs.data;
      unsigned nr_reloc = vp->branch_relocs.size / sizeof(*reloc);
      uint32_t *inst, target;

      if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
         /* First attempt failed.  Exec allocations store the address of
          * their owner's heap pointer as priv (see the &vp->exec argument
          * above), so the next entry can be released through it.  Keep
          * evicting while there is a next entry and the head entry is
          * still smaller than what we need.
          */
         while (heap->next && heap->size < vp->nr_insns) {
            struct nouveau_heap **evict = heap->next->priv;
            nouveau_heap_free(evict);
         }

         if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
            nv30->draw_flags |= NV30_NEW_VERTPROG;
            return;
         }
      }

      if (eng3d->oclass < NV40_3D_CLASS) {
         /* Pre-NV40 encoding: the target replaces the 0x7fc field of
          * instruction word 2.
          */
         while (nr_reloc--) {
            inst     = vp->insns[reloc->location].data;
            target   = vp->exec->start + reloc->target;

            inst[2] &= ~0x000007fc;
            inst[2] |= target << 2;
            reloc++;
         }
      } else {
         /* NV40+ encoding: the target is split, with target >> 3 in the low
          * six bits of word 2 and its low three bits in the top three bits
          * of word 3.
          */
         while (nr_reloc--) {
            inst     = vp->insns[reloc->location].data;
            target   = vp->exec->start + reloc->target;

            inst[2] &= ~0x0000003f;
            inst[2] |= target >> 3;
            inst[3] &= ~0xe0000000;
            inst[3] |= target << 29;
            reloc++;
         }
      }

      upload_code = true;
   }

   /* Program uses constants but has no data heap allocation yet: reserve
    * nr_consts slots and fix up the constant indices in the instructions.
    */
   if (vp->nr_consts && !vp->data) {
      struct nouveau_heap *heap = nv30->screen->vp_data_heap;
      struct nv30_shader_reloc *reloc = vp->const_relocs.data;
      unsigned nr_reloc = vp->const_relocs.size / sizeof(*reloc);
      uint32_t *inst, target;

      if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
         /* Data allocations store the owning vertex program as priv (see
          * the vp argument above); release the next entry's data through
          * its owner until the head entry is large enough or nothing is
          * left to evict.
          */
         while (heap->next && heap->size < vp->nr_consts) {
            struct nv30_vertprog *evp = heap->next->priv;
            nouveau_heap_free(&evp->data);
         }

         if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
            nv30->draw_flags |= NV30_NEW_VERTPROG;
            return;
         }
      }

      if (eng3d->oclass < NV40_3D_CLASS) {
         /* Pre-NV40: 9-bit constant index lives at bits 14..22 of word 1. */
         while (nr_reloc--) {
            inst     = vp->insns[reloc->location].data;
            target   = vp->data->start + reloc->target;

            inst[1] &= ~0x0007fc000;
            inst[1] |= (target & 0x1ff) << 14;
            reloc++;
         }
      } else {
         /* NV40+: 9-bit constant index lives at bits 12..20 of word 1. */
         while (nr_reloc--) {
            inst     = vp->insns[reloc->location].data;
            target   = vp->data->start + reloc->target;

            inst[1] &= ~0x0001ff000;
            inst[1] |= (target & 0x1ff) << 12;
            reloc++;
         }
      }

      /* The instruction words were just patched, so the code has to be
       * uploaded again along with every constant.
       */
      upload_code = true;
      upload_data = true;
   }

   if (vp->nr_consts) {
      struct nv04_resource *res = nv04_resource(nv30->vertprog.constbuf);

      for (i = 0; i < vp->nr_consts; i++) {
         struct nv30_vertprog_data *data = &vp->consts[i];

         if (data->index < 0) {
            /* Negative index: the value is not read from the constant
             * buffer (presumably a shader immediate -- confirm), so it is
             * only sent when the whole data area is being uploaded.
             */
            if (!upload_data)
               continue;
         } else {
            /* Constant-buffer backed entry: 4 floats (16 bytes) at
             * index * 4.  Skip it when the cached copy is still current and
             * no full upload is required; otherwise refresh the cache.
             */
            float *constbuf = (float *)res->data;
            if (!upload_data &&
                !memcmp(data->value, &constbuf[data->index * 4], 16))
               continue;
            memcpy(data->value, &constbuf[data->index * 4], 16);
         }

         /* 5 words: destination slot followed by the 4 value words. */
         BEGIN_NV04(push, NV30_3D(VP_UPLOAD_CONST_ID), 5);
         PUSH_DATA (push, vp->data->start + i);
         PUSH_DATAp(push, data->value, 4);
      }
   }

   if (upload_code) {
      /* Set the upload position, then push each 4-word instruction. */
      BEGIN_NV04(push, NV30_3D(VP_UPLOAD_FROM_ID), 1);
      PUSH_DATA (push, vp->exec->start);
      for (i = 0; i < vp->nr_insns; i++) {
         BEGIN_NV04(push, NV30_3D(VP_UPLOAD_INST(0)), 4);
         PUSH_DATAp(push, vp->insns[i].data, 4);
      }
   }

   /* Either program changed: point the hardware at this program's start and
    * re-emit the ENGINE setting (plus the attribute enables on NV40+, whose
    * second word also includes the fragment program's vp_or bits).
    */
   if (nv30->dirty & (NV30_NEW_VERTPROG | NV30_NEW_FRAGPROG)) {
      BEGIN_NV04(push, NV30_3D(VP_START_FROM_ID), 1);
      PUSH_DATA (push, vp->exec->start);
      if (eng3d->oclass < NV40_3D_CLASS) {
         BEGIN_NV04(push, NV30_3D(ENGINE), 1);
         PUSH_DATA (push, 0x00000013); /* vp instead of ff, somehow */
      } else {
         BEGIN_NV04(push, NV40_3D(VP_ATTRIB_EN), 2);
         PUSH_DATA (push, vp->ir);
         PUSH_DATA (push, vp->or | fp->vp_or);
         BEGIN_NV04(push, NV30_3D(ENGINE), 1);
         PUSH_DATA (push, 0x00000011);
      }
   }
}
    220 
    221 static void *
    222 nv30_vp_state_create(struct pipe_context *pipe,
    223                      const struct pipe_shader_state *cso)
    224 {
    225    struct nv30_vertprog *vp = CALLOC_STRUCT(nv30_vertprog);
    226    if (!vp)
    227       return NULL;
    228 
    229    vp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
    230    tgsi_scan_shader(vp->pipe.tokens, &vp->info);
    231    return vp;
    232 }
    233 
    234 static void
    235 nv30_vp_state_delete(struct pipe_context *pipe, void *hwcso)
    236 {
    237    struct nv30_vertprog *vp = hwcso;
    238 
    239    if (vp->translated)
    240       nv30_vertprog_destroy(vp);
    241 
    242    if (vp->draw)
    243       draw_delete_vertex_shader(nv30_context(pipe)->draw, vp->draw);
    244 
    245    FREE((void *)vp->pipe.tokens);
    246    FREE(vp);
    247 }
    248 
    249 static void
    250 nv30_vp_state_bind(struct pipe_context *pipe, void *hwcso)
    251 {
    252    struct nv30_context *nv30 = nv30_context(pipe);
    253 
    254    nv30->vertprog.program = hwcso;
    255    nv30->dirty |= NV30_NEW_VERTPROG;
    256 }
    257 
    258 void
    259 nv30_vertprog_init(struct pipe_context *pipe)
    260 {
    261    pipe->create_vs_state = nv30_vp_state_create;
    262    pipe->bind_vs_state = nv30_vp_state_bind;
    263    pipe->delete_vs_state = nv30_vp_state_delete;
    264 }
    265