vertexshader9.c revision 7ec681f3
1/*
2 * Copyright 2011 Joakim Sindholt <opensource@zhasha.com>
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
22
23#include "nine_helpers.h"
24#include "nine_shader.h"
25
26#include "vertexdeclaration9.h"
27#include "vertexshader9.h"
28
29#include "device9.h"
30#include "pipe/p_context.h"
31#include "cso_cache/cso_context.h"
32
33#define DBG_CHANNEL DBG_VERTEXSHADER
34
35HRESULT
36NineVertexShader9_ctor( struct NineVertexShader9 *This,
37                        struct NineUnknownParams *pParams,
38                        const DWORD *pFunction, void *cso )
39{
40    struct NineDevice9 *device;
41    struct nine_shader_info info;
42    struct pipe_context *pipe;
43    HRESULT hr;
44    unsigned i;
45
46    DBG("This=%p pParams=%p pFunction=%p cso=%p\n",
47        This, pParams, pFunction, cso);
48
49    hr = NineUnknown_ctor(&This->base, pParams);
50    if (FAILED(hr))
51        return hr;
52
53    if (cso) {
54        This->ff_cso = cso;
55        return D3D_OK;
56    }
57
58    device = This->base.device;
59
60    info.type = PIPE_SHADER_VERTEX;
61    info.byte_code = pFunction;
62    info.const_i_base = NINE_CONST_I_BASE(device->max_vs_const_f) / 16;
63    info.const_b_base = NINE_CONST_B_BASE(device->max_vs_const_f) / 16;
64    info.sampler_mask_shadow = 0x0;
65    info.fetch4 = 0x0;
66    info.sampler_ps1xtypes = 0x0;
67    info.fog_enable = 0;
68    info.point_size_min = 0;
69    info.point_size_max = 0;
70    info.add_constants_defs.c_combination = NULL;
71    info.add_constants_defs.int_const_added = NULL;
72    info.add_constants_defs.bool_const_added = NULL;
73    info.swvp_on = !!(device->params.BehaviorFlags & D3DCREATE_SOFTWARE_VERTEXPROCESSING);
74    info.process_vertices = false;
75
76    pipe = nine_context_get_pipe_acquire(device);
77    hr = nine_translate_shader(device, &info, pipe);
78    if (hr == D3DERR_INVALIDCALL &&
79        (device->params.BehaviorFlags & D3DCREATE_MIXED_VERTEXPROCESSING)) {
80        /* Retry with a swvp shader. It will require swvp to be on. */
81        info.swvp_on = true;
82        hr = nine_translate_shader(device, &info, pipe);
83    }
84    nine_context_get_pipe_release(device);
85    if (hr == D3DERR_INVALIDCALL)
86        ERR("Encountered buggy shader\n");
87    if (FAILED(hr))
88        return hr;
89    This->byte_code.version = info.version;
90    This->swvp_only = info.swvp_on;
91
92    This->byte_code.tokens = mem_dup(pFunction, info.byte_size);
93    if (!This->byte_code.tokens)
94        return E_OUTOFMEMORY;
95    This->byte_code.size = info.byte_size;
96
97    This->variant.cso = info.cso;
98    This->variant.const_ranges = info.const_ranges;
99    This->variant.const_used_size = info.const_used_size;
100    This->last_cso = info.cso;
101    This->last_const_ranges = info.const_ranges;
102    This->last_const_used_size = info.const_used_size;
103    This->last_key = (uint32_t) (info.swvp_on << 9);
104
105    This->lconstf = info.lconstf;
106    This->sampler_mask = info.sampler_mask;
107    This->position_t = info.position_t;
108    This->point_size = info.point_size;
109
110    memcpy(This->int_slots_used, info.int_slots_used, sizeof(This->int_slots_used));
111    memcpy(This->bool_slots_used, info.bool_slots_used, sizeof(This->bool_slots_used));
112
113    This->const_int_slots = info.const_int_slots;
114    This->const_bool_slots = info.const_bool_slots;
115
116    This->c_combinations = NULL;
117
118    for (i = 0; i < info.num_inputs && i < ARRAY_SIZE(This->input_map); ++i)
119        This->input_map[i].ndecl = info.input_map[i];
120    This->num_inputs = i;
121
122    return D3D_OK;
123}
124
125void
126NineVertexShader9_dtor( struct NineVertexShader9 *This )
127{
128    DBG("This=%p\n", This);
129
130    if (This->base.device) {
131        struct pipe_context *pipe = nine_context_get_pipe_multithread(This->base.device);
132        struct nine_shader_variant *var = &This->variant;
133        struct nine_shader_variant_so *var_so = &This->variant_so;
134
135        do {
136            if (var->cso) {
137                if (This->base.device->context.cso_shader.vs == var->cso)
138                    pipe->bind_vs_state(pipe, NULL);
139                pipe->delete_vs_state(pipe, var->cso);
140                FREE(var->const_ranges);
141            }
142            var = var->next;
143        } while (var);
144
145        while (var_so && var_so->vdecl) {
146            if (var_so->cso) {
147                This->base.device->pipe_sw->delete_vs_state(This->base.device->pipe_sw, var_so->cso);
148            }
149            var_so = var_so->next;
150        }
151
152        if (This->ff_cso) {
153            if (This->ff_cso == This->base.device->context.cso_shader.vs)
154                pipe->bind_vs_state(pipe, NULL);
155            pipe->delete_vs_state(pipe, This->ff_cso);
156        }
157    }
158    nine_shader_variants_free(&This->variant);
159    nine_shader_variants_so_free(&This->variant_so);
160
161    nine_shader_constant_combination_free(This->c_combinations);
162
163    FREE((void *)This->byte_code.tokens); /* const_cast */
164
165    FREE(This->lconstf.data);
166    FREE(This->lconstf.ranges);
167
168    NineUnknown_dtor(&This->base);
169}
170
171HRESULT NINE_WINAPI
172NineVertexShader9_GetFunction( struct NineVertexShader9 *This,
173                               void *pData,
174                               UINT *pSizeOfData )
175{
176    user_assert(pSizeOfData, D3DERR_INVALIDCALL);
177
178    if (!pData) {
179        *pSizeOfData = This->byte_code.size;
180        return D3D_OK;
181    }
182    user_assert(*pSizeOfData >= This->byte_code.size, D3DERR_INVALIDCALL);
183
184    memcpy(pData, This->byte_code.tokens, This->byte_code.size);
185
186    return D3D_OK;
187}
188
189void *
190NineVertexShader9_GetVariant( struct NineVertexShader9 *This,
191                              unsigned **const_ranges,
192                              unsigned *const_used_size )
193{
194    /* GetVariant is called from nine_context, thus we can
195     * get pipe directly */
196    struct pipe_context *pipe = This->base.device->context.pipe;
197    void *cso;
198    uint64_t key;
199
200    key = This->next_key;
201    if (key == This->last_key) {
202        *const_ranges = This->last_const_ranges;
203        *const_used_size = This->last_const_used_size;
204        return This->last_cso;
205    }
206
207    cso = nine_shader_variant_get(&This->variant, const_ranges, const_used_size, key);
208    if (!cso) {
209        struct NineDevice9 *device = This->base.device;
210        struct nine_shader_info info;
211        HRESULT hr;
212
213        info.type = PIPE_SHADER_VERTEX;
214        info.const_i_base = NINE_CONST_I_BASE(device->max_vs_const_f) / 16;
215        info.const_b_base = NINE_CONST_B_BASE(device->max_vs_const_f) / 16;
216        info.byte_code = This->byte_code.tokens;
217        info.sampler_mask_shadow = key & 0xf;
218        info.fetch4 = 0x0;
219        info.fog_enable = device->context.rs[D3DRS_FOGENABLE];
220        info.point_size_min = asfloat(device->context.rs[D3DRS_POINTSIZE_MIN]);
221        info.point_size_max = asfloat(device->context.rs[D3DRS_POINTSIZE_MAX]);
222        info.add_constants_defs.c_combination =
223            nine_shader_constant_combination_get(This->c_combinations, (key >> 16) & 0xff);
224        info.add_constants_defs.int_const_added = &This->int_slots_used;
225        info.add_constants_defs.bool_const_added = &This->bool_slots_used;
226        info.swvp_on = device->context.swvp;
227        info.process_vertices = false;
228
229        hr = nine_translate_shader(This->base.device, &info, pipe);
230        if (FAILED(hr))
231            return NULL;
232        nine_shader_variant_add(&This->variant, key, info.cso,
233                                info.const_ranges, info.const_used_size);
234        cso = info.cso;
235        *const_ranges = info.const_ranges;
236        *const_used_size = info.const_used_size;
237    }
238
239    This->last_key = key;
240    This->last_cso = cso;
241    This->last_const_ranges = *const_ranges;
242    This->last_const_used_size = *const_used_size;
243
244    return cso;
245}
246
247void *
248NineVertexShader9_GetVariantProcessVertices( struct NineVertexShader9 *This,
249                                             struct NineVertexDeclaration9 *vdecl_out,
250                                             struct pipe_stream_output_info *so )
251{
252    struct nine_shader_info info;
253    HRESULT hr;
254    void *cso;
255
256    cso = nine_shader_variant_so_get(&This->variant_so, vdecl_out, so);
257    if (cso)
258        return cso;
259
260    info.type = PIPE_SHADER_VERTEX;
261    info.const_i_base = 0;
262    info.const_b_base = 0;
263    info.byte_code = This->byte_code.tokens;
264    info.sampler_mask_shadow = 0;
265    info.fetch4 = 0x0;
266    info.fog_enable = false;
267    info.point_size_min = 0;
268    info.point_size_max = 0;
269    info.add_constants_defs.c_combination = NULL;
270    info.add_constants_defs.int_const_added = NULL;
271    info.add_constants_defs.bool_const_added = NULL;
272    info.swvp_on = true;
273    info.vdecl_out = vdecl_out;
274    info.process_vertices = true;
275    hr = nine_translate_shader(This->base.device, &info, This->base.device->pipe_sw);
276    if (FAILED(hr))
277        return NULL;
278    *so = info.so;
279    nine_shader_variant_so_add(&This->variant_so, vdecl_out, so, info.cso);
280    return info.cso;
281}
282
283IDirect3DVertexShader9Vtbl NineVertexShader9_vtable = {
284    (void *)NineUnknown_QueryInterface,
285    (void *)NineUnknown_AddRef,
286    (void *)NineUnknown_Release,
287    (void *)NineUnknown_GetDevice,
288    (void *)NineVertexShader9_GetFunction
289};
290
291static const GUID *NineVertexShader9_IIDs[] = {
292    &IID_IDirect3DVertexShader9,
293    &IID_IUnknown,
294    NULL
295};
296
297HRESULT
298NineVertexShader9_new( struct NineDevice9 *pDevice,
299                       struct NineVertexShader9 **ppOut,
300                       const DWORD *pFunction, void *cso )
301{
302    if (cso) {
303        NINE_DEVICE_CHILD_BIND_NEW(VertexShader9, ppOut, pDevice, pFunction, cso);
304    } else {
305        NINE_DEVICE_CHILD_NEW(VertexShader9, ppOut, pDevice, pFunction, cso);
306    }
307}
308