1 /*
2  * Copyright 2012 Red Hat Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
18  * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF
19  * OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
20  * SOFTWARE.
21  *
22  * Authors: Ben Skeggs
23  *
24  */
25 
26 #include "util/u_dynarray.h"
27 #include "tgsi/tgsi_parse.h"
28 
29 #include "nouveau/nv_object.xml.h"
30 #include "nv30-40_3d.xml.h"
31 #include "nv30_context.h"
32 #include "nv30_state.h"
33 
34 static void
nv30_vertprog_destroy(struct nv30_vertprog * vp)35 nv30_vertprog_destroy(struct nv30_vertprog *vp)
36 {
37    util_dynarray_fini(&vp->branch_relocs);
38    nouveau_heap_free(&vp->exec);
39    FREE(vp->insns);
40    vp->insns = NULL;
41    vp->nr_insns = 0;
42 
43    util_dynarray_fini(&vp->const_relocs);
44    nouveau_heap_free(&vp->data);
45    FREE(vp->consts);
46    vp->consts = NULL;
47    vp->nr_consts = 0;
48 
49    vp->translated = FALSE;
50 }
51 
52 void
nv30_vertprog_validate(struct nv30_context * nv30)53 nv30_vertprog_validate(struct nv30_context *nv30)
54 {
55    struct nouveau_pushbuf *push = nv30->base.pushbuf;
56    struct nouveau_object *eng3d = nv30->screen->eng3d;
57    struct nv30_vertprog *vp = nv30->vertprog.program;
58    struct nv30_fragprog *fp = nv30->fragprog.program;
59    boolean upload_code = FALSE;
60    boolean upload_data = FALSE;
61    unsigned i;
62 
63    if (nv30->dirty & NV30_NEW_FRAGPROG) {
64       if (memcmp(vp->texcoord, fp->texcoord, sizeof(vp->texcoord))) {
65          if (vp->translated)
66             nv30_vertprog_destroy(vp);
67          memcpy(vp->texcoord, fp->texcoord, sizeof(vp->texcoord));
68       }
69    }
70 
71    if (nv30->rast && nv30->rast->pipe.clip_plane_enable != vp->enabled_ucps) {
72       vp->enabled_ucps = nv30->rast->pipe.clip_plane_enable;
73       if (vp->translated)
74          nv30_vertprog_destroy(vp);
75    }
76 
77    if (!vp->translated) {
78       vp->translated = _nvfx_vertprog_translate(nv30, vp);
79       if (!vp->translated) {
80          nv30->draw_flags |= NV30_NEW_VERTPROG;
81          return;
82       }
83       nv30->dirty |= NV30_NEW_VERTPROG;
84    }
85 
86    if (!vp->exec) {
87       struct nouveau_heap *heap = nv30->screen->vp_exec_heap;
88       struct nv30_shader_reloc *reloc = vp->branch_relocs.data;
89       unsigned nr_reloc = vp->branch_relocs.size / sizeof(*reloc);
90       uint32_t *inst, target;
91 
92       if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
93          while (heap->next && heap->size < vp->nr_insns) {
94             struct nouveau_heap **evict = heap->next->priv;
95             nouveau_heap_free(evict);
96          }
97 
98          if (nouveau_heap_alloc(heap, vp->nr_insns, &vp->exec, &vp->exec)) {
99             nv30->draw_flags |= NV30_NEW_VERTPROG;
100             return;
101          }
102       }
103 
104       if (eng3d->oclass < NV40_3D_CLASS) {
105          while (nr_reloc--) {
106             inst     = vp->insns[reloc->location].data;
107             target   = vp->exec->start + reloc->target;
108 
109             inst[2] &= ~0x000007fc;
110             inst[2] |= target << 2;
111             reloc++;
112          }
113       } else {
114          while (nr_reloc--) {
115             inst     = vp->insns[reloc->location].data;
116             target   = vp->exec->start + reloc->target;
117 
118             inst[2] &= ~0x0000003f;
119             inst[2] |= target >> 3;
120             inst[3] &= ~0xe0000000;
121             inst[3] |= target << 29;
122             reloc++;
123          }
124       }
125 
126       upload_code = TRUE;
127    }
128 
129    if (vp->nr_consts && !vp->data) {
130       struct nouveau_heap *heap = nv30->screen->vp_data_heap;
131       struct nv30_shader_reloc *reloc = vp->const_relocs.data;
132       unsigned nr_reloc = vp->const_relocs.size / sizeof(*reloc);
133       uint32_t *inst, target;
134 
135       if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
136          while (heap->next && heap->size < vp->nr_consts) {
137             struct nv30_vertprog *evp = heap->next->priv;
138             nouveau_heap_free(&evp->data);
139          }
140 
141          if (nouveau_heap_alloc(heap, vp->nr_consts, vp, &vp->data)) {
142             nv30->draw_flags |= NV30_NEW_VERTPROG;
143             return;
144          }
145       }
146 
147       if (eng3d->oclass < NV40_3D_CLASS) {
148          while (nr_reloc--) {
149             inst     = vp->insns[reloc->location].data;
150             target   = vp->data->start + reloc->target;
151 
152             inst[1] &= ~0x0007fc000;
153             inst[1] |= (target & 0x1ff) << 14;
154             reloc++;
155          }
156       } else {
157          while (nr_reloc--) {
158             inst     = vp->insns[reloc->location].data;
159             target   = vp->data->start + reloc->target;
160 
161             inst[1] &= ~0x0001ff000;
162             inst[1] |= (target & 0x1ff) << 12;
163             reloc++;
164          }
165       }
166 
167       upload_code = TRUE;
168       upload_data = TRUE;
169    }
170 
171    if (vp->nr_consts) {
172       struct nv04_resource *res = nv04_resource(nv30->vertprog.constbuf);
173 
174       for (i = 0; i < vp->nr_consts; i++) {
175          struct nv30_vertprog_data *data = &vp->consts[i];
176 
177          if (data->index < 0) {
178             if (!upload_data)
179                continue;
180          } else {
181             float *constbuf = (float *)res->data;
182             if (!upload_data &&
183                 !memcmp(data->value, &constbuf[data->index * 4], 16))
184                continue;
185             memcpy(data->value, &constbuf[data->index * 4], 16);
186          }
187 
188          BEGIN_NV04(push, NV30_3D(VP_UPLOAD_CONST_ID), 5);
189          PUSH_DATA (push, vp->data->start + i);
190          PUSH_DATAp(push, data->value, 4);
191       }
192    }
193 
194    if (upload_code) {
195       BEGIN_NV04(push, NV30_3D(VP_UPLOAD_FROM_ID), 1);
196       PUSH_DATA (push, vp->exec->start);
197       for (i = 0; i < vp->nr_insns; i++) {
198          BEGIN_NV04(push, NV30_3D(VP_UPLOAD_INST(0)), 4);
199          PUSH_DATAp(push, vp->insns[i].data, 4);
200       }
201    }
202 
203    if (nv30->dirty & (NV30_NEW_VERTPROG | NV30_NEW_FRAGPROG)) {
204       BEGIN_NV04(push, NV30_3D(VP_START_FROM_ID), 1);
205       PUSH_DATA (push, vp->exec->start);
206       if (eng3d->oclass < NV40_3D_CLASS) {
207          BEGIN_NV04(push, NV30_3D(ENGINE), 1);
208          PUSH_DATA (push, 0x00000013); /* vp instead of ff, somehow */
209       } else {
210          BEGIN_NV04(push, NV40_3D(VP_ATTRIB_EN), 2);
211          PUSH_DATA (push, vp->ir);
212          PUSH_DATA (push, vp->or | fp->vp_or);
213          BEGIN_NV04(push, NV30_3D(ENGINE), 1);
214          PUSH_DATA (push, 0x00000011);
215       }
216    }
217 }
218 
219 static void *
nv30_vp_state_create(struct pipe_context * pipe,const struct pipe_shader_state * cso)220 nv30_vp_state_create(struct pipe_context *pipe,
221                      const struct pipe_shader_state *cso)
222 {
223    struct nv30_vertprog *vp = CALLOC_STRUCT(nv30_vertprog);
224    if (!vp)
225       return NULL;
226 
227    vp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
228    tgsi_scan_shader(vp->pipe.tokens, &vp->info);
229    return vp;
230 }
231 
232 static void
nv30_vp_state_delete(struct pipe_context * pipe,void * hwcso)233 nv30_vp_state_delete(struct pipe_context *pipe, void *hwcso)
234 {
235    struct nv30_vertprog *vp = hwcso;
236 
237    if (vp->translated)
238       nv30_vertprog_destroy(vp);
239    FREE((void *)vp->pipe.tokens);
240    FREE(vp);
241 }
242 
243 static void
nv30_vp_state_bind(struct pipe_context * pipe,void * hwcso)244 nv30_vp_state_bind(struct pipe_context *pipe, void *hwcso)
245 {
246    struct nv30_context *nv30 = nv30_context(pipe);
247 
248    nv30->vertprog.program = hwcso;
249    nv30->dirty |= NV30_NEW_VERTPROG;
250 }
251 
252 void
nv30_vertprog_init(struct pipe_context * pipe)253 nv30_vertprog_init(struct pipe_context *pipe)
254 {
255    pipe->create_vs_state = nv30_vp_state_create;
256    pipe->bind_vs_state = nv30_vp_state_bind;
257    pipe->delete_vs_state = nv30_vp_state_delete;
258 }
259