Subversion Repositories Kolibri OS

Rev

Blame | Last modification | View Log | RSS feed

  1. /*
  2.  * Copyright 2012 Red Hat Inc.
  3.  *
  4.  * Permission is hereby granted, free of charge, to any person obtaining a
  5.  * copy of this software and associated documentation files (the "Software"),
  6.  * to deal in the Software without restriction, including without limitation
  7.  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8.  * and/or sell copies of the Software, and to permit persons to whom the
  9.  * Software is furnished to do so, subject to the following conditions:
  10.  *
  11.  * The above copyright notice and this permission notice shall be included in
  12.  * all copies or substantial portions of the Software.
  13.  *
  14.  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15.  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16.  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
  17.  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
  18.  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
  19.  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
  20.  * OTHER DEALINGS IN THE SOFTWARE.
  21.  *
  22.  * Authors: Ben Skeggs
  23.  *
  24.  */
  25.  
  26. #include "draw/draw_context.h"
  27. #include "util/u_dynarray.h"
  28. #include "tgsi/tgsi_parse.h"
  29.  
  30. #include "nv_object.xml.h"
  31. #include "nv30/nv30-40_3d.xml.h"
  32. #include "nv30/nv30_context.h"
  33. #include "nv30/nvfx_shader.h"
  34. #include "nv30/nv30_state.h"
  35.  
  36. static void
  37. nv30_vertprog_destroy(struct nv30_vertprog *vp)
  38. {
  39.    util_dynarray_fini(&vp->branch_relocs);
  40.    nouveau_heap_free(&vp->exec);
  41.    FREE(vp->insns);
  42.    vp->insns = NULL;
  43.    vp->nr_insns = 0;
  44.  
  45.    util_dynarray_fini(&vp->const_relocs);
  46.    nouveau_heap_free(&vp->data);
  47.    FREE(vp->consts);
  48.    vp->consts = NULL;
  49.    vp->nr_consts = 0;
  50.  
  51.    vp->translated = FALSE;
  52. }
  53.  
  54. void
  55. nv30_vertprog_validate(struct nv30_context *nv30)
  56. {
  57.    struct nouveau_pushbuf *push = nv30->base.pushbuf;
  58.    struct nouveau_object *eng3d = nv30->screen->eng3d;
  59.    struct nv30_vertprog *vp = nv30->vertprog.program;
  60.    struct nv30_fragprog *fp = nv30->fragprog.program;
  61.    boolean upload_code = FALSE;
  62.    boolean upload_data = FALSE;
  63.    unsigned i;
  64.  
  65.    if (nv30->dirty & NV30_NEW_FRAGPROG) {
  66.       if (memcmp(vp->texcoord, fp->texcoord, sizeof(vp->texcoord))) {
  67.          if (vp->translated)
  68.             nv30_vertprog_destroy(vp);
  69.          memcpy(vp->texcoord, fp->texcoord, sizeof(vp->texcoord));
  70.       }
  71.    }
  72.  
  73.    if (nv30->rast && nv30->rast->pipe.clip_plane_enable != vp->enabled_ucps) {
  74.       vp->enabled_ucps = nv30->rast->pipe.clip_plane_enable;
  75.       if (vp->translated)
  76.          nv30_vertprog_destroy(vp);
  77.    }
  78.  
  79.    if (!vp->translated) {
  80.       vp->translated = _nvfx_vertprog_translate(eng3d->oclass, vp);
  81.       if (!vp->translated) {
  82.          nv30->draw_flags |= NV30_NEW_VERTPROG;
  83.          return;
  84.       }
  85.       nv30->dirty |= NV30_NEW_VERTPROG;
  86.    }
  87.  
  88.    if (!vp->exec) {
  89.       struct nouveau_heap *heap = nv30->screen->vp_exec_heap;
  90.       struct nv30_shader_reloc *reloc = vp->branch_relocs.data;
  91.       unsigned nr_reloc = vp->branch_relocs.size / sizeof(*reloc);
  92.       uint32_t *inst, target;
  93.  
  94.       if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
  95.          while (heap->next && heap->size < vp->nr_insns) {
  96.             struct nouveau_heap **evict = heap->next->priv;
  97.             nouveau_heap_free(evict);
  98.          }
  99.  
  100.          if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
  101.             nv30->draw_flags |= NV30_NEW_VERTPROG;
  102.             return;
  103.          }
  104.       }
  105.  
  106.       if (eng3d->oclass < NV40_3D_CLASS) {
  107.          while (nr_reloc--) {
  108.             inst     = vp->insns[reloc->location].data;
  109.             target   = vp->exec->start + reloc->target;
  110.  
  111.             inst[2] &= ~0x000007fc;
  112.             inst[2] |= target << 2;
  113.             reloc++;
  114.          }
  115.       } else {
  116.          while (nr_reloc--) {
  117.             inst     = vp->insns[reloc->location].data;
  118.             target   = vp->exec->start + reloc->target;
  119.  
  120.             inst[2] &= ~0x0000003f;
  121.             inst[2] |= target >> 3;
  122.             inst[3] &= ~0xe0000000;
  123.             inst[3] |= target << 29;
  124.             reloc++;
  125.          }
  126.       }
  127.  
  128.       upload_code = TRUE;
  129.    }
  130.  
  131.    if (vp->nr_consts && !vp->data) {
  132.       struct nouveau_heap *heap = nv30->screen->vp_data_heap;
  133.       struct nv30_shader_reloc *reloc = vp->const_relocs.data;
  134.       unsigned nr_reloc = vp->const_relocs.size / sizeof(*reloc);
  135.       uint32_t *inst, target;
  136.  
  137.       if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
  138.          while (heap->next && heap->size < vp->nr_consts) {
  139.             struct nv30_vertprog *evp = heap->next->priv;
  140.             nouveau_heap_free(&evp->data);
  141.          }
  142.  
  143.          if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
  144.             nv30->draw_flags |= NV30_NEW_VERTPROG;
  145.             return;
  146.          }
  147.       }
  148.  
  149.       if (eng3d->oclass < NV40_3D_CLASS) {
  150.          while (nr_reloc--) {
  151.             inst     = vp->insns[reloc->location].data;
  152.             target   = vp->data->start + reloc->target;
  153.  
  154.             inst[1] &= ~0x0007fc000;
  155.             inst[1] |= (target & 0x1ff) << 14;
  156.             reloc++;
  157.          }
  158.       } else {
  159.          while (nr_reloc--) {
  160.             inst     = vp->insns[reloc->location].data;
  161.             target   = vp->data->start + reloc->target;
  162.  
  163.             inst[1] &= ~0x0001ff000;
  164.             inst[1] |= (target & 0x1ff) << 12;
  165.             reloc++;
  166.          }
  167.       }
  168.  
  169.       upload_code = TRUE;
  170.       upload_data = TRUE;
  171.    }
  172.  
  173.    if (vp->nr_consts) {
  174.       struct nv04_resource *res = nv04_resource(nv30->vertprog.constbuf);
  175.  
  176.       for (i = 0; i < vp->nr_consts; i++) {
  177.          struct nv30_vertprog_data *data = &vp->consts[i];
  178.  
  179.          if (data->index < 0) {
  180.             if (!upload_data)
  181.                continue;
  182.          } else {
  183.             float *constbuf = (float *)res->data;
  184.             if (!upload_data &&
  185.                 !memcmp(data->value, &constbuf[data->index * 4], 16))
  186.                continue;
  187.             memcpy(data->value, &constbuf[data->index * 4], 16);
  188.          }
  189.  
  190.          BEGIN_NV04(push, NV30_3D(VP_UPLOAD_CONST_ID), 5);
  191.          PUSH_DATA (push, vp->data->start + i);
  192.          PUSH_DATAp(push, data->value, 4);
  193.       }
  194.    }
  195.  
  196.    if (upload_code) {
  197.       BEGIN_NV04(push, NV30_3D(VP_UPLOAD_FROM_ID), 1);
  198.       PUSH_DATA (push, vp->exec->start);
  199.       for (i = 0; i < vp->nr_insns; i++) {
  200.          BEGIN_NV04(push, NV30_3D(VP_UPLOAD_INST(0)), 4);
  201.          PUSH_DATAp(push, vp->insns[i].data, 4);
  202.       }
  203.    }
  204.  
  205.    if (nv30->dirty & (NV30_NEW_VERTPROG | NV30_NEW_FRAGPROG)) {
  206.       BEGIN_NV04(push, NV30_3D(VP_START_FROM_ID), 1);
  207.       PUSH_DATA (push, vp->exec->start);
  208.       if (eng3d->oclass < NV40_3D_CLASS) {
  209.          BEGIN_NV04(push, NV30_3D(ENGINE), 1);
  210.          PUSH_DATA (push, 0x00000013); /* vp instead of ff, somehow */
  211.       } else {
  212.          BEGIN_NV04(push, NV40_3D(VP_ATTRIB_EN), 2);
  213.          PUSH_DATA (push, vp->ir);
  214.          PUSH_DATA (push, vp->or | fp->vp_or);
  215.          BEGIN_NV04(push, NV30_3D(ENGINE), 1);
  216.          PUSH_DATA (push, 0x00000011);
  217.       }
  218.    }
  219. }
  220.  
  221. static void *
  222. nv30_vp_state_create(struct pipe_context *pipe,
  223.                      const struct pipe_shader_state *cso)
  224. {
  225.    struct nv30_vertprog *vp = CALLOC_STRUCT(nv30_vertprog);
  226.    if (!vp)
  227.       return NULL;
  228.  
  229.    vp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
  230.    tgsi_scan_shader(vp->pipe.tokens, &vp->info);
  231.    return vp;
  232. }
  233.  
  234. static void
  235. nv30_vp_state_delete(struct pipe_context *pipe, void *hwcso)
  236. {
  237.    struct nv30_vertprog *vp = hwcso;
  238.  
  239.    if (vp->translated)
  240.       nv30_vertprog_destroy(vp);
  241.  
  242.    if (vp->draw)
  243.       draw_delete_vertex_shader(nv30_context(pipe)->draw, vp->draw);
  244.  
  245.    FREE((void *)vp->pipe.tokens);
  246.    FREE(vp);
  247. }
  248.  
  249. static void
  250. nv30_vp_state_bind(struct pipe_context *pipe, void *hwcso)
  251. {
  252.    struct nv30_context *nv30 = nv30_context(pipe);
  253.  
  254.    nv30->vertprog.program = hwcso;
  255.    nv30->dirty |= NV30_NEW_VERTPROG;
  256. }
  257.  
  258. void
  259. nv30_vertprog_init(struct pipe_context *pipe)
  260. {
  261.    pipe->create_vs_state = nv30_vp_state_create;
  262.    pipe->bind_vs_state = nv30_vp_state_bind;
  263.    pipe->delete_vs_state = nv30_vp_state_delete;
  264. }
  265.