wined3d: Don't respecify compressed textures in surface_upload_data().
[wine] / dlls / wined3d / shader_sm4.c
1 /*
2  * Copyright 2009 Henri Verbeet for CodeWeavers
3  *
4  * This library is free software; you can redistribute it and/or
5  * modify it under the terms of the GNU Lesser General Public
6  * License as published by the Free Software Foundation; either
7  * version 2.1 of the License, or (at your option) any later version.
8  *
9  * This library is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12  * Lesser General Public License for more details.
13  *
14  * You should have received a copy of the GNU Lesser General Public
15  * License along with this library; if not, write to the Free Software
16  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
17  */
18
19 #include "config.h"
20 #include "wine/port.h"
21
22 #include "wined3d_private.h"
23
24 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
25
/* Opcode token: the low byte selects the opcode, bits 24-27 hold the
 * instruction length (shader_sm4_read_opcode() reports length - 1 as the
 * parameter size). */
#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0xf << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

#define WINED3D_SM4_OPCODE_MASK                 0xff

/* Operand token: bits 20-21 say how many index DWORDs follow the token,
 * bits 12-15 hold the register type. */
#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3 << WINED3D_SM4_REGISTER_ORDER_SHIFT)

#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xf << WINED3D_SM4_REGISTER_TYPE_SHIFT)

/* Only read for immediate constant operands. */
#define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
#define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3 << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

/* The write mask (destinations) and the swizzle (sources) both start at
 * bit 4 of the operand token; the swizzle is twice as wide. */
#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xf << WINED3D_SM4_WRITEMASK_SHIFT)

#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xff << WINED3D_SM4_SWIZZLE_SHIFT)

/* Version token: major version in bits 4-7, minor version in bits 0-3. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      ((version) & 0xf)
48
/* Opcode values as they appear in the low byte of an instruction's opcode
 * token (see WINED3D_SM4_OPCODE_MASK). Only the opcodes listed here are
 * recognised by get_opcode_info(). */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD    = 0x00,
    WINED3D_SM4_OP_DP3    = 0x10,
    WINED3D_SM4_OP_DP4    = 0x11,
    WINED3D_SM4_OP_EXP    = 0x19,
    WINED3D_SM4_OP_LOG    = 0x2f,
    WINED3D_SM4_OP_MOV    = 0x36,
    WINED3D_SM4_OP_MUL    = 0x38,
    WINED3D_SM4_OP_RET    = 0x3e,
    WINED3D_SM4_OP_RSQ    = 0x44,
    WINED3D_SM4_OP_SINCOS = 0x4d,
};
62
/* Register type field of an operand token (WINED3D_SM4_REGISTER_TYPE_MASK).
 * The values double as indices into register_type_table. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP        = 0x0,
    WINED3D_SM4_RT_INPUT       = 0x1,
    WINED3D_SM4_RT_OUTPUT      = 0x2,
    WINED3D_SM4_RT_IMMCONST    = 0x4,
    WINED3D_SM4_RT_CONSTBUFFER = 0x8,
};
71
/* Immediate constant type field of an operand token
 * (WINED3D_SM4_IMMCONST_TYPE_MASK). shader_sm4_read_src_param() reads one
 * DWORD of data for FLOAT and four DWORDs for FLOAT4. */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_FLOAT = 0x1,
    WINED3D_SM4_IMMCONST_FLOAT4 = 0x2,
};
77
/* Per-shader parser state, allocated by shader_sm4_init() and released by
 * shader_sm4_free(). */
struct wined3d_sm4_data
{
    /* Decoded from the version token by shader_sm4_read_header();
     * map_register() consults its type field. */
    struct wined3d_shader_version shader_version;
    /* Start of the token stream plus the token count from the header;
     * shader_sm4_is_end() compares the read pointer against it. */
    const DWORD *end;
    /* Stored as passed to shader_sm4_init(); may be NULL, which
     * map_register() reports as an error. */
    const struct wined3d_shader_signature *output_signature;
};
84
/* One row of opcode_table: how an SM4 opcode is handed on to wined3d. */
struct wined3d_sm4_opcode_info
{
    /* SM4 opcode value this row describes. */
    enum wined3d_sm4_opcode opcode;
    /* Handler index copied into the instruction by shader_sm4_read_opcode(). */
    enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
    /* Destination and source parameter counts copied into the instruction. */
    UINT dst_count;
    UINT src_count;
};
92
/* One row of the sysval_map table: the register that map_sysval() substitutes
 * for a system value semantic. */
struct sysval_map
{
    /* System value semantic to match. */
    enum wined3d_sysval_semantic sysval;
    /* Register type and index written to the register on a match. */
    WINED3DSHADER_PARAM_REGISTER_TYPE register_type;
    UINT register_idx;
};
99
/* Recognised SM4 opcodes, searched linearly by get_opcode_info().
 * Columns: SM4 opcode, wined3d handler index, destination count, source count. */
static const struct wined3d_sm4_opcode_info opcode_table[] =
{
    {WINED3D_SM4_OP_ADD,    WINED3DSIH_ADD,         1,  2},
    {WINED3D_SM4_OP_DP3,    WINED3DSIH_DP3,         1,  2},
    {WINED3D_SM4_OP_DP4,    WINED3DSIH_DP4,         1,  2},
    {WINED3D_SM4_OP_EXP,    WINED3DSIH_EXP,         1,  1},
    {WINED3D_SM4_OP_LOG,    WINED3DSIH_LOG,         1,  1},
    {WINED3D_SM4_OP_MOV,    WINED3DSIH_MOV,         1,  1},
    {WINED3D_SM4_OP_MUL,    WINED3DSIH_MUL,         1,  2},
    {WINED3D_SM4_OP_RET,    WINED3DSIH_RET,         0,  0},
    {WINED3D_SM4_OP_RSQ,    WINED3DSIH_RSQ,         1,  1},
    {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS,      1,  2},
};
113
/* Maps an SM4 register type to the wined3d register type. The array is
 * indexed directly by the enum wined3d_sm4_register_type value, so entry
 * order matters; slots without a known SM4 register type hold 0. Values
 * beyond the end of the table are rejected by the parameter readers. */
static const WINED3DSHADER_PARAM_REGISTER_TYPE register_type_table[] =
{
    /* WINED3D_SM4_RT_TEMP */           WINED3DSPR_TEMP,
    /* WINED3D_SM4_RT_INPUT */          WINED3DSPR_INPUT,
    /* WINED3D_SM4_RT_OUTPUT */         WINED3DSPR_OUTPUT,
    /* UNKNOWN */                       0,
    /* WINED3D_SM4_RT_IMMCONST */       WINED3DSPR_IMMCONST,
    /* UNKNOWN */                       0,
    /* UNKNOWN */                       0,
    /* UNKNOWN */                       0,
    /* WINED3D_SM4_RT_CONSTBUFFER */    WINED3DSPR_CONSTBUFFER,
};
126
/* System value semantics and the registers that replace them, applied by
 * map_sysval(). Columns: semantic, register type, register index. */
static const struct sysval_map sysval_map[] =
{
    {WINED3D_SV_DEPTH,      WINED3DSPR_DEPTHOUT,    0},
    {WINED3D_SV_TARGET0,    WINED3DSPR_COLOROUT,    0},
    {WINED3D_SV_TARGET1,    WINED3DSPR_COLOROUT,    1},
    {WINED3D_SV_TARGET2,    WINED3DSPR_COLOROUT,    2},
    {WINED3D_SV_TARGET3,    WINED3DSPR_COLOROUT,    3},
    {WINED3D_SV_TARGET4,    WINED3DSPR_COLOROUT,    4},
    {WINED3D_SV_TARGET5,    WINED3DSPR_COLOROUT,    5},
    {WINED3D_SV_TARGET6,    WINED3DSPR_COLOROUT,    6},
    {WINED3D_SV_TARGET7,    WINED3DSPR_COLOROUT,    7},
};
139
140 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
141 {
142     unsigned int i;
143
144     for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
145     {
146         if (opcode == opcode_table[i].opcode) return &opcode_table[i];
147     }
148
149     return NULL;
150 }
151
152 static void map_sysval(enum wined3d_sysval_semantic sysval, struct wined3d_shader_register *reg)
153 {
154     unsigned int i;
155
156     for (i = 0; i < sizeof(sysval_map) / sizeof(*sysval_map); ++i)
157     {
158         if (sysval == sysval_map[i].sysval)
159         {
160             reg->type = sysval_map[i].register_type;
161             reg->idx = sysval_map[i].register_idx;
162         }
163     }
164 }
165
166 static void map_register(struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
167 {
168     switch (priv->shader_version.type)
169     {
170         case WINED3D_SHADER_TYPE_PIXEL:
171             if (reg->type == WINED3DSPR_OUTPUT)
172             {
173                 unsigned int i;
174                 const struct wined3d_shader_signature *s = priv->output_signature;
175
176                 if (!s)
177                 {
178                     ERR("Shader has no output signature, unable to map register.\n");
179                     break;
180                 }
181
182                 for (i = 0; i < s->element_count; ++i)
183                 {
184                     if (s->elements[i].register_idx == reg->idx)
185                     {
186                         map_sysval(s->elements[i].sysval_semantic, reg);
187                         break;
188                     }
189                 }
190             }
191             break;
192
193         default:
194             break;
195     }
196 }
197
198 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
199 {
200     struct wined3d_sm4_data *priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv));
201     if (!priv)
202     {
203         ERR("Failed to allocate private data\n");
204         return NULL;
205     }
206
207     priv->output_signature = output_signature;
208
209     return priv;
210 }
211
/* Release the parser state returned by shader_sm4_init(). */
static void shader_sm4_free(void *data)
{
    struct wined3d_sm4_data *priv = data;

    HeapFree(GetProcessHeap(), 0, priv);
}
216
217 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
218 {
219     struct wined3d_sm4_data *priv = data;
220     DWORD version_token;
221
222     priv->end = *ptr;
223
224     version_token = *(*ptr)++;
225     TRACE("version: 0x%08x\n", version_token);
226
227     TRACE("token count: %u\n", **ptr);
228     priv->end += *(*ptr)++;
229
230     switch (version_token >> 16)
231     {
232         case WINED3D_SM4_PS:
233             priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
234             break;
235
236         case WINED3D_SM4_VS:
237             priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
238             break;
239
240         case WINED3D_SM4_GS:
241             priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
242             break;
243
244         default:
245             FIXME("Unrecognized shader type %#x\n", version_token >> 16);
246     }
247     priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
248     priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
249
250     *shader_version = priv->shader_version;
251 }
252
253 static void shader_sm4_read_opcode(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins,
254         UINT *param_size)
255 {
256     const struct wined3d_sm4_opcode_info *opcode_info;
257     DWORD token = *(*ptr)++;
258     DWORD opcode = token & WINED3D_SM4_OPCODE_MASK;
259
260     *param_size = ((token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
261
262     opcode_info = get_opcode_info(opcode);
263     if (!opcode_info)
264     {
265         FIXME("Unrecognized opcode %#x, token 0x%08x\n", opcode, token);
266         ins->handler_idx = WINED3DSIH_TABLE_SIZE;
267         return;
268     }
269
270     ins->handler_idx = opcode_info->handler_idx;
271     ins->flags = 0;
272     ins->coissue = 0;
273     ins->predicate = 0;
274     ins->dst_count = opcode_info->dst_count;
275     ins->src_count = opcode_info->src_count;
276 }
277
278 static void shader_sm4_read_src_param(void *data, const DWORD **ptr, struct wined3d_shader_src_param *src_param,
279         struct wined3d_shader_src_param *src_rel_addr)
280 {
281     struct wined3d_sm4_data *priv = data;
282     DWORD token = *(*ptr)++;
283     enum wined3d_sm4_register_type register_type;
284     DWORD order;
285
286     register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
287     if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
288     {
289         FIXME("Unhandled register type %#x\n", register_type);
290         src_param->reg.type = WINED3DSPR_TEMP;
291     }
292     else
293     {
294         src_param->reg.type = register_type_table[register_type];
295     }
296
297     order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
298
299     if (order < 1) src_param->reg.idx = ~0U;
300     else src_param->reg.idx = *(*ptr)++;
301
302     if (order < 2) src_param->reg.array_idx = ~0U;
303     else src_param->reg.array_idx = *(*ptr)++;
304
305     if (order > 2) FIXME("Unhandled order %u.\n", order);
306
307     if (register_type == WINED3D_SM4_RT_IMMCONST)
308     {
309         enum wined3d_sm4_immconst_type immconst_type =
310                 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
311         src_param->swizzle = WINED3DSP_NOSWIZZLE;
312
313         switch(immconst_type)
314         {
315             case WINED3D_SM4_IMMCONST_FLOAT:
316                 src_param->reg.immconst_type = WINED3D_IMMCONST_FLOAT;
317                 memcpy(src_param->reg.immconst_data, *ptr, 1 * sizeof(DWORD));
318                 *ptr += 1;
319                 break;
320
321             case WINED3D_SM4_IMMCONST_FLOAT4:
322                 src_param->reg.immconst_type = WINED3D_IMMCONST_FLOAT4;
323                 memcpy(src_param->reg.immconst_data, *ptr, 4 * sizeof(DWORD));
324                 *ptr += 4;
325                 break;
326
327             default:
328                 FIXME("Unhandled immediate constant type %#x\n", immconst_type);
329                 break;
330         }
331     }
332     else
333     {
334         src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
335     }
336
337     src_param->modifiers = 0;
338     src_param->reg.rel_addr = NULL;
339
340     map_register(priv, &src_param->reg);
341 }
342
343 static void shader_sm4_read_dst_param(void *data, const DWORD **ptr, struct wined3d_shader_dst_param *dst_param,
344         struct wined3d_shader_src_param *dst_rel_addr)
345 {
346     struct wined3d_sm4_data *priv = data;
347     DWORD token = *(*ptr)++;
348     enum wined3d_sm4_register_type register_type;
349     DWORD order;
350
351     register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
352     if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
353     {
354         FIXME("Unhandled register type %#x\n", register_type);
355         dst_param->reg.type = WINED3DSPR_TEMP;
356     }
357     else
358     {
359         dst_param->reg.type = register_type_table[register_type];
360     }
361
362     order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
363
364     if (order < 1) dst_param->reg.idx = ~0U;
365     else dst_param->reg.idx = *(*ptr)++;
366
367     if (order < 2) dst_param->reg.array_idx = ~0U;
368     else dst_param->reg.array_idx = *(*ptr)++;
369
370     if (order > 2) FIXME("Unhandled order %u.\n", order);
371
372     dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
373     dst_param->modifiers = 0;
374     dst_param->shift = 0;
375     dst_param->reg.rel_addr = NULL;
376
377     map_register(priv, &dst_param->reg);
378 }
379
380 static void shader_sm4_read_semantic(const DWORD **ptr, struct wined3d_shader_semantic *semantic)
381 {
382     FIXME("ptr %p, semantic %p stub!\n", ptr, semantic);
383 }
384
385 static void shader_sm4_read_comment(const DWORD **ptr, const char **comment)
386 {
387     FIXME("ptr %p, comment %p stub!\n", ptr, comment);
388     *comment = NULL;
389 }
390
391 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
392 {
393     struct wined3d_sm4_data *priv = data;
394     return *ptr == priv->end;
395 }
396
/* The SM4 parser's entry points, exported as a shader frontend. The
 * initializer is positional, so the order must match the member order of
 * struct wined3d_shader_frontend (declared outside this file). */
const struct wined3d_shader_frontend sm4_shader_frontend =
{
    shader_sm4_init,
    shader_sm4_free,
    shader_sm4_read_header,
    shader_sm4_read_opcode,
    shader_sm4_read_src_param,
    shader_sm4_read_dst_param,
    shader_sm4_read_semantic,
    shader_sm4_read_comment,
    shader_sm4_is_end,
};