Home | History | Annotate | Download | only in nv30
      1 /*
      2  * Copyright 2012 Red Hat Inc.
      3  *
      4  * Permission is hereby granted, free of charge, to any person obtaining a
      5  * copy of this software and associated documentation files (the "Software"),
      6  * to deal in the Software without restriction, including without limitation
      7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
      8  * and/or sell copies of the Software, and to permit persons to whom the
      9  * Software is furnished to do so, subject to the following conditions:
     10  *
     11  * The above copyright notice and this permission notice shall be included in
     12  * all copies or substantial portions of the Software.
     13  *
     14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
     15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
     16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
     17  * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
     18  * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
     19  * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
     20  * SOFTWARE.
     21  *
     22  * Authors: Ben Skeggs
     23  *
     24  */
     25 
     26 #include "util/u_dynarray.h"
     27 #include "tgsi/tgsi_parse.h"
     28 
     29 #include "nouveau/nv_object.xml.h"
     30 #include "nv30-40_3d.xml.h"
     31 #include "nv30_context.h"
     32 #include "nv30_state.h"
     33 
     34 static void
     35 nv30_vertprog_destroy(struct nv30_vertprog *vp)
     36 {
     37    util_dynarray_fini(&vp->branch_relocs);
     38    nouveau_heap_free(&vp->exec);
     39    FREE(vp->insns);
     40    vp->insns = NULL;
     41    vp->nr_insns = 0;
     42 
     43    util_dynarray_fini(&vp->const_relocs);
     44    nouveau_heap_free(&vp->data);
     45    FREE(vp->consts);
     46    vp->consts = NULL;
     47    vp->nr_consts = 0;
     48 
     49    vp->translated = FALSE;
     50 }
     51 
     52 void
     53 nv30_vertprog_validate(struct nv30_context *nv30)
     54 {
     55    struct nouveau_pushbuf *push = nv30->base.pushbuf;
     56    struct nouveau_object *eng3d = nv30->screen->eng3d;
     57    struct nv30_vertprog *vp = nv30->vertprog.program;
     58    struct nv30_fragprog *fp = nv30->fragprog.program;
     59    boolean upload_code = FALSE;
     60    boolean upload_data = FALSE;
     61    unsigned i;
     62 
     63    if (nv30->dirty & NV30_NEW_FRAGPROG) {
     64       if (memcmp(vp->texcoord, fp->texcoord, sizeof(vp->texcoord))) {
     65          if (vp->translated)
     66             nv30_vertprog_destroy(vp);
     67          memcpy(vp->texcoord, fp->texcoord, sizeof(vp->texcoord));
     68       }
     69    }
     70 
     71    if (nv30->rast && nv30->rast->pipe.clip_plane_enable != vp->enabled_ucps) {
     72       vp->enabled_ucps = nv30->rast->pipe.clip_plane_enable;
     73       if (vp->translated)
     74          nv30_vertprog_destroy(vp);
     75    }
     76 
     77    if (!vp->translated) {
     78       vp->translated = _nvfx_vertprog_translate(nv30, vp);
     79       if (!vp->translated) {
     80          nv30->draw_flags |= NV30_NEW_VERTPROG;
     81          return;
     82       }
     83       nv30->dirty |= NV30_NEW_VERTPROG;
     84    }
     85 
     86    if (!vp->exec) {
     87       struct nouveau_heap *heap = nv30->screen->vp_exec_heap;
     88       struct nv30_shader_reloc *reloc = vp->branch_relocs.data;
     89       unsigned nr_reloc = vp->branch_relocs.size / sizeof(*reloc);
     90       uint32_t *inst, target;
     91 
     92       if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
     93          while (heap->next && heap->size < vp->nr_insns) {
     94             struct nouveau_heap **evict = heap->next->priv;
     95             nouveau_heap_free(evict);
     96          }
     97 
     98          if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
     99             nv30->draw_flags |= NV30_NEW_VERTPROG;
    100             return;
    101          }
    102       }
    103 
    104       if (eng3d->oclass < NV40_3D_CLASS) {
    105          while (nr_reloc--) {
    106             inst     = vp->insns[reloc->location].data;
    107             target   = vp->exec->start + reloc->target;
    108 
    109             inst[2] &= ~0x000007fc;
    110             inst[2] |= target << 2;
    111             reloc++;
    112          }
    113       } else {
    114          while (nr_reloc--) {
    115             inst     = vp->insns[reloc->location].data;
    116             target   = vp->exec->start + reloc->target;
    117 
    118             inst[2] &= ~0x0000003f;
    119             inst[2] |= target >> 3;
    120             inst[3] &= ~0xe0000000;
    121             inst[3] |= target << 29;
    122             reloc++;
    123          }
    124       }
    125 
    126       upload_code = TRUE;
    127    }
    128 
    129    if (vp->nr_consts && !vp->data) {
    130       struct nouveau_heap *heap = nv30->screen->vp_data_heap;
    131       struct nv30_shader_reloc *reloc = vp->const_relocs.data;
    132       unsigned nr_reloc = vp->const_relocs.size / sizeof(*reloc);
    133       uint32_t *inst, target;
    134 
    135       if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
    136          while (heap->next && heap->size < vp->nr_consts) {
    137             struct nv30_vertprog *evp = heap->next->priv;
    138             nouveau_heap_free(&evp->data);
    139          }
    140 
    141          if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
    142             nv30->draw_flags |= NV30_NEW_VERTPROG;
    143             return;
    144          }
    145       }
    146 
    147       if (eng3d->oclass < NV40_3D_CLASS) {
    148          while (nr_reloc--) {
    149             inst     = vp->insns[reloc->location].data;
    150             target   = vp->data->start + reloc->target;
    151 
    152             inst[1] &= ~0x0007fc000;
    153             inst[1] |= (target & 0x1ff) << 14;
    154             reloc++;
    155          }
    156       } else {
    157          while (nr_reloc--) {
    158             inst     = vp->insns[reloc->location].data;
    159             target   = vp->data->start + reloc->target;
    160 
    161             inst[1] &= ~0x0001ff000;
    162             inst[1] |= (target & 0x1ff) << 12;
    163             reloc++;
    164          }
    165       }
    166 
    167       upload_code = TRUE;
    168       upload_data = TRUE;
    169    }
    170 
    171    if (vp->nr_consts) {
    172       struct nv04_resource *res = nv04_resource(nv30->vertprog.constbuf);
    173 
    174       for (i = 0; i < vp->nr_consts; i++) {
    175          struct nv30_vertprog_data *data = &vp->consts[i];
    176 
    177          if (data->index < 0) {
    178             if (!upload_data)
    179                continue;
    180          } else {
    181             float *constbuf = (float *)res->data;
    182             if (!upload_data &&
    183                 !memcmp(data->value, &constbuf[data->index * 4], 16))
    184                continue;
    185             memcpy(data->value, &constbuf[data->index * 4], 16);
    186          }
    187 
    188          BEGIN_NV04(push, NV30_3D(VP_UPLOAD_CONST_ID), 5);
    189          PUSH_DATA (push, vp->data->start + i);
    190          PUSH_DATAp(push, data->value, 4);
    191       }
    192    }
    193 
    194    if (upload_code) {
    195       BEGIN_NV04(push, NV30_3D(VP_UPLOAD_FROM_ID), 1);
    196       PUSH_DATA (push, vp->exec->start);
    197       for (i = 0; i < vp->nr_insns; i++) {
    198          BEGIN_NV04(push, NV30_3D(VP_UPLOAD_INST(0)), 4);
    199          PUSH_DATAp(push, vp->insns[i].data, 4);
    200       }
    201    }
    202 
    203    if (nv30->dirty & (NV30_NEW_VERTPROG | NV30_NEW_FRAGPROG)) {
    204       BEGIN_NV04(push, NV30_3D(VP_START_FROM_ID), 1);
    205       PUSH_DATA (push, vp->exec->start);
    206       if (eng3d->oclass < NV40_3D_CLASS) {
    207          BEGIN_NV04(push, NV30_3D(ENGINE), 1);
    208          PUSH_DATA (push, 0x00000013); /* vp instead of ff, somehow */
    209       } else {
    210          BEGIN_NV04(push, NV40_3D(VP_ATTRIB_EN), 2);
    211          PUSH_DATA (push, vp->ir);
    212          PUSH_DATA (push, vp->or | fp->vp_or);
    213          BEGIN_NV04(push, NV30_3D(ENGINE), 1);
    214          PUSH_DATA (push, 0x00000011);
    215       }
    216    }
    217 }
    218 
    219 static void *
    220 nv30_vp_state_create(struct pipe_context *pipe,
    221                      const struct pipe_shader_state *cso)
    222 {
    223    struct nv30_vertprog *vp = CALLOC_STRUCT(nv30_vertprog);
    224    if (!vp)
    225       return NULL;
    226 
    227    vp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
    228    tgsi_scan_shader(vp->pipe.tokens, &vp->info);
    229    return vp;
    230 }
    231 
    232 static void
    233 nv30_vp_state_delete(struct pipe_context *pipe, void *hwcso)
    234 {
    235    struct nv30_vertprog *vp = hwcso;
    236 
    237    if (vp->translated)
    238       nv30_vertprog_destroy(vp);
    239    FREE((void *)vp->pipe.tokens);
    240    FREE(vp);
    241 }
    242 
    243 static void
    244 nv30_vp_state_bind(struct pipe_context *pipe, void *hwcso)
    245 {
    246    struct nv30_context *nv30 = nv30_context(pipe);
    247 
    248    nv30->vertprog.program = hwcso;
    249    nv30->dirty |= NV30_NEW_VERTPROG;
    250 }
    251 
    252 void
    253 nv30_vertprog_init(struct pipe_context *pipe)
    254 {
    255    pipe->create_vs_state = nv30_vp_state_create;
    256    pipe->bind_vs_state = nv30_vp_state_bind;
    257    pipe->delete_vs_state = nv30_vp_state_delete;
    258 }
    259