jscript: Added VBArray.dimensions() implementation.
[wine] / dlls / wined3d / shader_sm4.c
1 /*
2  * Copyright 2009 Henri Verbeet for CodeWeavers
3  *
4  * This library is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * This library is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with this library; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
17  */
18
19 #include "config.h"
20 #include "wine/port.h"
21
22 #include "wined3d_private.h"
23
24 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
25
/* Bit 31 of an opcode token; when set, shader_sm4_read_opcode() consumes one
 * extra modifier token. Written as an unsigned constant because shifting a
 * signed 1 into the sign bit is undefined behaviour and would yield a
 * negative value. */
#define WINED3D_SM4_INSTRUCTION_MODIFIER        (1u << 31)

/* 4-bit instruction length field of an opcode token, starting at bit 24. */
#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0xf << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

/* Low 8 bits of an opcode token select the enum wined3d_sm4_opcode value. */
#define WINED3D_SM4_OPCODE_MASK                 0xff

/* Bit 31 of a register token; when set, shader_sm4_read_src_param() consumes
 * one extra modifier token. Unsigned for the same reason as above. */
#define WINED3D_SM4_REGISTER_MODIFIER           (1u << 31)

/* 2-bit "order" field of a register token: the number of index tokens that
 * follow the register token. */
#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3 << WINED3D_SM4_REGISTER_ORDER_SHIFT)

/* 4-bit register type field (enum wined3d_sm4_register_type). */
#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xf << WINED3D_SM4_REGISTER_TYPE_SHIFT)

/* 2-bit immediate constant type field (enum wined3d_sm4_immconst_type). */
#define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
#define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3 << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

/* 4-bit destination write mask. */
#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xf << WINED3D_SM4_WRITEMASK_SHIFT)

/* 8-bit source swizzle; occupies the same bit position as the write mask. */
#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xff << WINED3D_SM4_SWIZZLE_SHIFT)

/* Major/minor shader version, taken from the low byte of the version token. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)
52
/* Opcode values as they appear in the low byte of an SM4 opcode token
 * (see WINED3D_SM4_OPCODE_MASK). Only the opcodes listed here are
 * recognized by get_opcode_info(). */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD = 0x00,
    WINED3D_SM4_OP_AND = 0x01,
    WINED3D_SM4_OP_BREAK = 0x02,
    WINED3D_SM4_OP_BREAKC = 0x03,
    WINED3D_SM4_OP_CUT = 0x09,
    WINED3D_SM4_OP_DIV = 0x0e,
    WINED3D_SM4_OP_DP3 = 0x10,
    WINED3D_SM4_OP_DP4 = 0x11,
    WINED3D_SM4_OP_EMIT = 0x13,
    WINED3D_SM4_OP_ENDIF = 0x15,
    WINED3D_SM4_OP_ENDLOOP = 0x16,
    WINED3D_SM4_OP_EXP = 0x19,
    WINED3D_SM4_OP_FRC = 0x1a,
    WINED3D_SM4_OP_FTOI = 0x1b,
    WINED3D_SM4_OP_IADD = 0x1e,
    WINED3D_SM4_OP_IF = 0x1f,
    WINED3D_SM4_OP_IEQ = 0x20,
    WINED3D_SM4_OP_IGE = 0x21,
    WINED3D_SM4_OP_IMUL = 0x26,
    WINED3D_SM4_OP_ITOF = 0x2b,
    WINED3D_SM4_OP_LD = 0x2d,
    WINED3D_SM4_OP_LOG = 0x2f,
    WINED3D_SM4_OP_LOOP = 0x30,
    WINED3D_SM4_OP_LT = 0x31,
    WINED3D_SM4_OP_MAD = 0x32,
    WINED3D_SM4_OP_MIN = 0x33,
    WINED3D_SM4_OP_MAX = 0x34,
    WINED3D_SM4_OP_MOV = 0x36,
    WINED3D_SM4_OP_MOVC = 0x37,
    WINED3D_SM4_OP_MUL = 0x38,
    WINED3D_SM4_OP_RET = 0x3e,
    WINED3D_SM4_OP_RSQ = 0x44,
    WINED3D_SM4_OP_SAMPLE = 0x45,
    WINED3D_SM4_OP_SAMPLE_LOD = 0x48,
    WINED3D_SM4_OP_SAMPLE_GRAD = 0x49,
    WINED3D_SM4_OP_SINCOS = 0x4d,
    WINED3D_SM4_OP_UTOF = 0x56,
};
93
/* Register type values as encoded in the register type field of an SM4
 * register token. The value is used directly as an index into
 * register_type_table, which already documents slot 0x7 as
 * WINED3D_SM4_RT_RESOURCE; the constant is declared here so that the enum
 * and the table agree. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP         = 0x0,
    WINED3D_SM4_RT_INPUT        = 0x1,
    WINED3D_SM4_RT_OUTPUT       = 0x2,
    WINED3D_SM4_RT_IMMCONST     = 0x4,
    WINED3D_SM4_RT_SAMPLER      = 0x6,
    WINED3D_SM4_RT_RESOURCE     = 0x7,
    WINED3D_SM4_RT_CONSTBUFFER  = 0x8,
    WINED3D_SM4_RT_NULL         = 0xd,
};
104
/* Immediate constant layouts, as encoded in the immconst type field of a
 * register token: one DWORD (scalar) or four DWORDs (vec4) of data. */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_SCALAR = 1,
    WINED3D_SM4_IMMCONST_VEC4 = 2,
};
110
111 struct wined3d_sm4_data
112 {
113     struct wined3d_shader_version shader_version;
114     const DWORD *end;
115     const struct wined3d_shader_signature *output_signature;
116 };
117
118 struct wined3d_sm4_opcode_info
119 {
120     enum wined3d_sm4_opcode opcode;
121     enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
122     UINT dst_count;
123     UINT src_count;
124 };
125
126 struct sysval_map
127 {
128     enum wined3d_sysval_semantic sysval;
129     WINED3DSHADER_PARAM_REGISTER_TYPE register_type;
130     UINT register_idx;
131 };
132
133 static const struct wined3d_sm4_opcode_info opcode_table[] =
134 {
135     {WINED3D_SM4_OP_ADD,        WINED3DSIH_ADD,         1,  2},
136     {WINED3D_SM4_OP_AND,        WINED3DSIH_AND,         1,  2},
137     {WINED3D_SM4_OP_BREAK,      WINED3DSIH_BREAK,       0,  0},
138     {WINED3D_SM4_OP_BREAKC,     WINED3DSIH_BREAKP,      0,  1},
139     {WINED3D_SM4_OP_CUT,        WINED3DSIH_CUT,         0,  0},
140     {WINED3D_SM4_OP_DIV,        WINED3DSIH_DIV,         1,  2},
141     {WINED3D_SM4_OP_DP3,        WINED3DSIH_DP3,         1,  2},
142     {WINED3D_SM4_OP_DP4,        WINED3DSIH_DP4,         1,  2},
143     {WINED3D_SM4_OP_EMIT,       WINED3DSIH_EMIT,        0,  0},
144     {WINED3D_SM4_OP_ENDIF,      WINED3DSIH_ENDIF,       0,  0},
145     {WINED3D_SM4_OP_ENDLOOP,    WINED3DSIH_ENDLOOP,     0,  0},
146     {WINED3D_SM4_OP_EXP,        WINED3DSIH_EXP,         1,  1},
147     {WINED3D_SM4_OP_FRC,        WINED3DSIH_FRC,         1,  1},
148     {WINED3D_SM4_OP_FTOI,       WINED3DSIH_FTOI,        1,  1},
149     {WINED3D_SM4_OP_IADD,       WINED3DSIH_IADD,        1,  2},
150     {WINED3D_SM4_OP_IF,         WINED3DSIH_IF,          0,  1},
151     {WINED3D_SM4_OP_IEQ,        WINED3DSIH_IEQ,         1,  2},
152     {WINED3D_SM4_OP_IGE,        WINED3DSIH_IGE,         1,  2},
153     {WINED3D_SM4_OP_IMUL,       WINED3DSIH_IMUL,        2,  2},
154     {WINED3D_SM4_OP_ITOF,       WINED3DSIH_ITOF,        1,  1},
155     {WINED3D_SM4_OP_LD,         WINED3DSIH_LD,          1,  2},
156     {WINED3D_SM4_OP_LOG,        WINED3DSIH_LOG,         1,  1},
157     {WINED3D_SM4_OP_LOOP,       WINED3DSIH_LOOP,        0,  0},
158     {WINED3D_SM4_OP_LT,         WINED3DSIH_LT,          1,  2},
159     {WINED3D_SM4_OP_MAD,        WINED3DSIH_MAD,         1,  3},
160     {WINED3D_SM4_OP_MIN,        WINED3DSIH_MIN,         1,  2},
161     {WINED3D_SM4_OP_MAX,        WINED3DSIH_MAX,         1,  2},
162     {WINED3D_SM4_OP_MOV,        WINED3DSIH_MOV,         1,  1},
163     {WINED3D_SM4_OP_MOVC,       WINED3DSIH_MOVC,        1,  3},
164     {WINED3D_SM4_OP_MUL,        WINED3DSIH_MUL,         1,  2},
165     {WINED3D_SM4_OP_RET,        WINED3DSIH_RET,         0,  0},
166     {WINED3D_SM4_OP_RSQ,        WINED3DSIH_RSQ,         1,  1},
167     {WINED3D_SM4_OP_SAMPLE,     WINED3DSIH_SAMPLE,      1,  3},
168     {WINED3D_SM4_OP_SAMPLE_LOD, WINED3DSIH_SAMPLE_LOD,  1,  4},
169     {WINED3D_SM4_OP_SAMPLE_GRAD,WINED3DSIH_SAMPLE_GRAD, 1,  5},
170     {WINED3D_SM4_OP_SINCOS,     WINED3DSIH_SINCOS,      2,  1},
171     {WINED3D_SM4_OP_UTOF,       WINED3DSIH_UTOF,        1,  1},
172 };
173
174 static const WINED3DSHADER_PARAM_REGISTER_TYPE register_type_table[] =
175 {
176     /* WINED3D_SM4_RT_TEMP */           WINED3DSPR_TEMP,
177     /* WINED3D_SM4_RT_INPUT */          WINED3DSPR_INPUT,
178     /* WINED3D_SM4_RT_OUTPUT */         WINED3DSPR_OUTPUT,
179     /* UNKNOWN */                       0,
180     /* WINED3D_SM4_RT_IMMCONST */       WINED3DSPR_IMMCONST,
181     /* UNKNOWN */                       0,
182     /* WINED3D_SM4_RT_SAMPLER */        WINED3DSPR_SAMPLER,
183     /* WINED3D_SM4_RT_RESOURCE */       WINED3DSPR_RESOURCE,
184     /* WINED3D_SM4_RT_CONSTBUFFER */    WINED3DSPR_CONSTBUFFER,
185     /* UNKNOWN */                       0,
186     /* UNKNOWN */                       0,
187     /* UNKNOWN */                       0,
188     /* UNKNOWN */                       0,
189     /* WINED3D_SM4_RT_NULL */           WINED3DSPR_NULL,
190 };
191
192 static const struct sysval_map sysval_map[] =
193 {
194     {WINED3D_SV_DEPTH,      WINED3DSPR_DEPTHOUT,    0},
195     {WINED3D_SV_TARGET0,    WINED3DSPR_COLOROUT,    0},
196     {WINED3D_SV_TARGET1,    WINED3DSPR_COLOROUT,    1},
197     {WINED3D_SV_TARGET2,    WINED3DSPR_COLOROUT,    2},
198     {WINED3D_SV_TARGET3,    WINED3DSPR_COLOROUT,    3},
199     {WINED3D_SV_TARGET4,    WINED3DSPR_COLOROUT,    4},
200     {WINED3D_SV_TARGET5,    WINED3DSPR_COLOROUT,    5},
201     {WINED3D_SV_TARGET6,    WINED3DSPR_COLOROUT,    6},
202     {WINED3D_SV_TARGET7,    WINED3DSPR_COLOROUT,    7},
203 };
204
205 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
206 {
207     unsigned int i;
208
209     for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
210     {
211         if (opcode == opcode_table[i].opcode) return &opcode_table[i];
212     }
213
214     return NULL;
215 }
216
217 static void map_sysval(enum wined3d_sysval_semantic sysval, struct wined3d_shader_register *reg)
218 {
219     unsigned int i;
220
221     for (i = 0; i < sizeof(sysval_map) / sizeof(*sysval_map); ++i)
222     {
223         if (sysval == sysval_map[i].sysval)
224         {
225             reg->type = sysval_map[i].register_type;
226             reg->idx = sysval_map[i].register_idx;
227         }
228     }
229 }
230
231 static void map_register(struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
232 {
233     switch (priv->shader_version.type)
234     {
235         case WINED3D_SHADER_TYPE_PIXEL:
236             if (reg->type == WINED3DSPR_OUTPUT)
237             {
238                 unsigned int i;
239                 const struct wined3d_shader_signature *s = priv->output_signature;
240
241                 if (!s)
242                 {
243                     ERR("Shader has no output signature, unable to map register.\n");
244                     break;
245                 }
246
247                 for (i = 0; i < s->element_count; ++i)
248                 {
249                     if (s->elements[i].register_idx == reg->idx)
250                     {
251                         map_sysval(s->elements[i].sysval_semantic, reg);
252                         break;
253                     }
254                 }
255             }
256             break;
257
258         default:
259             break;
260     }
261 }
262
263 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
264 {
265     struct wined3d_sm4_data *priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv));
266     if (!priv)
267     {
268         ERR("Failed to allocate private data\n");
269         return NULL;
270     }
271
272     priv->output_signature = output_signature;
273
274     return priv;
275 }
276
277 static void shader_sm4_free(void *data)
278 {
279     HeapFree(GetProcessHeap(), 0, data);
280 }
281
282 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
283 {
284     struct wined3d_sm4_data *priv = data;
285     DWORD version_token;
286
287     priv->end = *ptr;
288
289     version_token = *(*ptr)++;
290     TRACE("version: 0x%08x\n", version_token);
291
292     TRACE("token count: %u\n", **ptr);
293     priv->end += *(*ptr)++;
294
295     switch (version_token >> 16)
296     {
297         case WINED3D_SM4_PS:
298             priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
299             break;
300
301         case WINED3D_SM4_VS:
302             priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
303             break;
304
305         case WINED3D_SM4_GS:
306             priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
307             break;
308
309         default:
310             FIXME("Unrecognized shader type %#x\n", version_token >> 16);
311     }
312     priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
313     priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
314
315     *shader_version = priv->shader_version;
316 }
317
318 static void shader_sm4_read_opcode(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins,
319         UINT *param_size)
320 {
321     const struct wined3d_sm4_opcode_info *opcode_info;
322     DWORD token = *(*ptr)++;
323     DWORD opcode = token & WINED3D_SM4_OPCODE_MASK;
324
325     *param_size = ((token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
326
327     opcode_info = get_opcode_info(opcode);
328     if (!opcode_info)
329     {
330         FIXME("Unrecognized opcode %#x, token 0x%08x\n", opcode, token);
331         ins->handler_idx = WINED3DSIH_TABLE_SIZE;
332         return;
333     }
334
335     ins->handler_idx = opcode_info->handler_idx;
336     ins->flags = 0;
337     ins->coissue = 0;
338     ins->predicate = 0;
339     ins->dst_count = opcode_info->dst_count;
340     ins->src_count = opcode_info->src_count;
341
342     if (token & WINED3D_SM4_INSTRUCTION_MODIFIER)
343     {
344         DWORD modifier = *(*ptr)++;
345         FIXME("Skipping modifier 0x%08x.\n", modifier);
346     }
347 }
348
349 static void shader_sm4_read_src_param(void *data, const DWORD **ptr, struct wined3d_shader_src_param *src_param,
350         struct wined3d_shader_src_param *src_rel_addr)
351 {
352     struct wined3d_sm4_data *priv = data;
353     DWORD token = *(*ptr)++;
354     enum wined3d_sm4_register_type register_type;
355     DWORD order;
356
357     register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
358     if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
359     {
360         FIXME("Unhandled register type %#x\n", register_type);
361         src_param->reg.type = WINED3DSPR_TEMP;
362     }
363     else
364     {
365         src_param->reg.type = register_type_table[register_type];
366     }
367
368     if (token & WINED3D_SM4_REGISTER_MODIFIER)
369     {
370         DWORD modifier = *(*ptr)++;
371
372         /* FIXME: This will probably break down at some point. The SM4
373          * modifiers look like flags, while wined3d currently has an enum
374          * with possible combinations, e.g. WINED3DSPSM_ABSNEG. */
375         switch (modifier)
376         {
377             case 0x41:
378                 src_param->modifiers = WINED3DSPSM_NEG;
379                 break;
380
381             case 0x81:
382                 src_param->modifiers = WINED3DSPSM_ABS;
383                 break;
384
385             default:
386                 FIXME("Skipping modifier 0x%08x.\n", modifier);
387                 src_param->modifiers = WINED3DSPSM_NONE;
388                 break;
389         }
390     }
391     else
392     {
393         src_param->modifiers = WINED3DSPSM_NONE;
394     }
395
396     order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
397
398     if (order < 1) src_param->reg.idx = ~0U;
399     else src_param->reg.idx = *(*ptr)++;
400
401     if (order < 2) src_param->reg.array_idx = ~0U;
402     else src_param->reg.array_idx = *(*ptr)++;
403
404     if (order > 2) FIXME("Unhandled order %u.\n", order);
405
406     if (register_type == WINED3D_SM4_RT_IMMCONST)
407     {
408         enum wined3d_sm4_immconst_type immconst_type =
409                 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
410         src_param->swizzle = WINED3DSP_NOSWIZZLE;
411
412         switch(immconst_type)
413         {
414             case WINED3D_SM4_IMMCONST_SCALAR:
415                 src_param->reg.immconst_type = WINED3D_IMMCONST_SCALAR;
416                 memcpy(src_param->reg.immconst_data, *ptr, 1 * sizeof(DWORD));
417                 *ptr += 1;
418                 break;
419
420             case WINED3D_SM4_IMMCONST_VEC4:
421                 src_param->reg.immconst_type = WINED3D_IMMCONST_VEC4;
422                 memcpy(src_param->reg.immconst_data, *ptr, 4 * sizeof(DWORD));
423                 *ptr += 4;
424                 break;
425
426             default:
427                 FIXME("Unhandled immediate constant type %#x\n", immconst_type);
428                 break;
429         }
430     }
431     else
432     {
433         src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
434     }
435
436     src_param->reg.rel_addr = NULL;
437
438     map_register(priv, &src_param->reg);
439 }
440
441 static void shader_sm4_read_dst_param(void *data, const DWORD **ptr, struct wined3d_shader_dst_param *dst_param,
442         struct wined3d_shader_src_param *dst_rel_addr)
443 {
444     struct wined3d_sm4_data *priv = data;
445     DWORD token = *(*ptr)++;
446     enum wined3d_sm4_register_type register_type;
447     DWORD order;
448
449     register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
450     if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
451     {
452         FIXME("Unhandled register type %#x\n", register_type);
453         dst_param->reg.type = WINED3DSPR_TEMP;
454     }
455     else
456     {
457         dst_param->reg.type = register_type_table[register_type];
458     }
459
460     order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
461
462     if (order < 1) dst_param->reg.idx = ~0U;
463     else dst_param->reg.idx = *(*ptr)++;
464
465     if (order < 2) dst_param->reg.array_idx = ~0U;
466     else dst_param->reg.array_idx = *(*ptr)++;
467
468     if (order > 2) FIXME("Unhandled order %u.\n", order);
469
470     dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
471     dst_param->modifiers = 0;
472     dst_param->shift = 0;
473     dst_param->reg.rel_addr = NULL;
474
475     map_register(priv, &dst_param->reg);
476 }
477
478 static void shader_sm4_read_semantic(const DWORD **ptr, struct wined3d_shader_semantic *semantic)
479 {
480     FIXME("ptr %p, semantic %p stub!\n", ptr, semantic);
481 }
482
483 static void shader_sm4_read_comment(const DWORD **ptr, const char **comment, UINT *comment_size)
484 {
485     FIXME("ptr %p, comment %p, comment_size %p stub!\n", ptr, comment, comment_size);
486     *comment = NULL;
487 }
488
489 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
490 {
491     struct wined3d_sm4_data *priv = data;
492     return *ptr == priv->end;
493 }
494
495 const struct wined3d_shader_frontend sm4_shader_frontend =
496 {
497     shader_sm4_init,
498     shader_sm4_free,
499     shader_sm4_read_header,
500     shader_sm4_read_opcode,
501     shader_sm4_read_src_param,
502     shader_sm4_read_dst_param,
503     shader_sm4_read_semantic,
504     shader_sm4_read_comment,
505     shader_sm4_is_end,
506 };