1 /*
2  * Copyright 2011 Joakim Sindholt <opensource@zhasha.com>
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * on the rights to use, copy, modify, merge, publish, distribute, sub
8  * license, and/or sell copies of the Software, and to permit persons to whom
9  * the Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18  * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21  * USE OR OTHER DEALINGS IN THE SOFTWARE. */
22 
23 #ifndef _NINE_PIXELSHADER9_H_
24 #define _NINE_PIXELSHADER9_H_
25 
26 #include "iunknown.h"
27 #include "nine_shader.h"
28 #include "nine_state.h"
29 #include "basetexture9.h"
30 #include "nine_ff.h"
31 #include "surface9.h"
32 
33 struct nine_lconstf;
34 
35 struct NinePixelShader9
36 {
37     struct NineUnknown base;
38     struct nine_shader_variant variant;
39 
40     struct {
41         const DWORD *tokens;
42         DWORD size;
43         uint8_t version; /* (major << 4) | minor */
44     } byte_code;
45 
46     uint8_t bumpenvmat_needed;
47     uint16_t sampler_mask;
48     uint8_t rt_mask;
49 
50     boolean int_slots_used[NINE_MAX_CONST_I];
51     boolean bool_slots_used[NINE_MAX_CONST_B];
52 
53     unsigned const_int_slots;
54     unsigned const_bool_slots;
55 
56     struct nine_shader_constant_combination *c_combinations;
57 
58     uint64_t ff_key[6];
59     void *ff_cso;
60 
61     uint64_t last_key;
62     void *last_cso;
63     unsigned *last_const_ranges;
64     unsigned last_const_used_size; /* in bytes */
65 
66     uint64_t next_key;
67 };
/* Typed view of an untyped pointer: returns data as a NinePixelShader9
 * pointer without touching the pointee. */
static inline struct NinePixelShader9 *
NinePixelShader9( void *data )
{
    struct NinePixelShader9 *shader = data;

    return shader;
}
73 
74 static inline BOOL
NinePixelShader9_UpdateKey(struct NinePixelShader9 * ps,struct nine_context * context)75 NinePixelShader9_UpdateKey( struct NinePixelShader9 *ps,
76                             struct nine_context *context )
77 {
78     uint16_t samplers_shadow;
79     uint16_t samplers_ps1_types;
80     uint8_t projected;
81     uint64_t key;
82     BOOL res;
83 
84     samplers_shadow = (uint16_t)((context->samplers_shadow & NINE_PS_SAMPLERS_MASK) >> NINE_SAMPLER_PS(0));
85     key = samplers_shadow & ps->sampler_mask;
86 
87     if (unlikely(ps->byte_code.version < 0x20)) {
88         /* variable targets */
89         uint32_t m = ps->sampler_mask;
90         samplers_ps1_types = 0;
91         while (m) {
92             int s = ffs(m) - 1;
93             m &= ~(1 << s);
94             samplers_ps1_types |= (context->texture[s].enabled ? context->texture[s].pstype : 1) << (s * 2);
95         }
96         /* Note: For ps 1.X, only samplers 0 1 2 and 3 are available (except 1.4 where 4 and 5 are available).
97          * ps < 1.4: samplers_shadow 4b, samplers_ps1_types 8b, projected 8b
98          * ps 1.4: samplers_shadow 6b, samplers_ps1_types 12b
99          * Tot ps X.X samplers_shadow + extra: 20b */
100         assert((ps->byte_code.version < 0x14 && !(ps->sampler_mask & 0xFFF0)) || !(ps->sampler_mask & 0xFFC0));
101 
102         if (unlikely(ps->byte_code.version < 0x14)) {
103             key |= samplers_ps1_types << 4;
104             projected = nine_ff_get_projected_key_programmable(context);
105             key |= ((uint64_t) projected) << 12;
106         } else {
107             key |= samplers_ps1_types << 6;
108         }
109     }
110 
111     if (ps->byte_code.version < 0x30) {
112         key |= ((uint64_t)context->rs[D3DRS_FOGENABLE]) << 20;
113         key |= ((uint64_t)context->rs[D3DRS_FOGTABLEMODE]) << 21;
114     }
115 
116     /* centroid interpolation automatically used for color ps inputs */
117     if (context->rt[0]->base.info.nr_samples)
118         key |= ((uint64_t)1) << 22;
119 
120     if ((ps->const_int_slots > 0 || ps->const_bool_slots > 0) && context->inline_constants)
121         key |= ((uint64_t)nine_shader_constant_combination_key(&ps->c_combinations,
122                                                                ps->int_slots_used,
123                                                                ps->bool_slots_used,
124                                                                (void *)context->ps_const_i,
125                                                                context->ps_const_b)) << 24;
126 
127     res = ps->last_key != key;
128     if (res)
129         ps->next_key = key;
130     return res;
131 }
132 
/* Only declared in this header.
 * NOTE(review): presumably returns the driver shader object for the key
 * chosen by NinePixelShader9_UpdateKey() and fills both out parameters
 * (constant ranges, used constant size) -- confirm against the definition. */
void *
NinePixelShader9_GetVariant( struct NinePixelShader9 *ps,
                             unsigned **const_ranges, unsigned *const_used_size );
137 
138 /*** public ***/
139 
140 HRESULT
141 NinePixelShader9_new( struct NineDevice9 *pDevice,
142                       struct NinePixelShader9 **ppOut,
143                       const DWORD *pFunction, void *cso );
144 
145 HRESULT
146 NinePixelShader9_ctor( struct NinePixelShader9 *,
147                        struct NineUnknownParams *pParams,
148                        const DWORD *pFunction, void *cso );
149 
/* Destructor for a pixel shader object. */
void
NinePixelShader9_dtor( struct NinePixelShader9 *This );
152 
153 HRESULT NINE_WINAPI
154 NinePixelShader9_GetFunction( struct NinePixelShader9 *This,
155                               void *pData,
156                               UINT *pSizeOfData );
157 
158 #endif /* _NINE_PIXELSHADER9_H_ */
159