[WINED3D]
[reactos.git] / reactos / dll / directx / wine / wined3d / shader_sm4.c
1 /*
2 * Copyright 2009 Henri Verbeet for CodeWeavers
3 *
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
8 *
9 * This library is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 *
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
17 */
18
19 #include "config.h"
20 #include "wine/port.h"
21
22 #include "wined3d_private.h"
23
/* Declare d3d_shader as the default debug channel for this file. */
WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
25
/*
 * Bit fields of the SM4 token stream.
 *
 * Opcode token (first DWORD of every instruction):
 *   bits  0..7    opcode
 *   bits 24..30   instruction length in DWORDs, counting the opcode token
 *                 itself (shader_sm4_read_opcode() subtracts one to obtain
 *                 the parameter size)
 *
 * The length field is 7 bits wide. A narrower mask truncates the length of
 * any instruction longer than 15 DWORDs (e.g. one with several vec4
 * immediate operands) and desynchronises the parser.
 */
#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0x7f << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

#define WINED3D_SM4_OPCODE_MASK                 0xff

/*
 * Operand token (first DWORD of every source / destination parameter):
 *   bits  0..1    immediate constant type (immediate operands only)
 *   bits  4..7    write mask (destination operands)
 *   bits  4..11   swizzle (source operands)
 *   bits 12..19   register type
 *   bits 20..21   register order, i.e. how many index DWORDs follow
 *
 * The register type field is 8 bits wide. Masking only 4 bits would make
 * register types >= 0x10 alias onto unrelated low-numbered types instead
 * of being reported as unhandled.
 */
#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3 << WINED3D_SM4_REGISTER_ORDER_SHIFT)

#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xff << WINED3D_SM4_REGISTER_TYPE_SHIFT)

#define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
#define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3 << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xf << WINED3D_SM4_WRITEMASK_SHIFT)

#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xff << WINED3D_SM4_SWIZZLE_SHIFT)

/* Version token: minor version in bits 0..3, major version in bits 4..7. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)
48
/*
 * Raw SM4 opcode values, as found in the bits of an opcode token selected
 * by WINED3D_SM4_OPCODE_MASK. Only the opcodes this parser knows about are
 * listed; the numbering is sparse.
 */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD      = 0x00,
    WINED3D_SM4_OP_AND      = 0x01,
    WINED3D_SM4_OP_BREAK    = 0x02,
    WINED3D_SM4_OP_BREAKC   = 0x03,
    WINED3D_SM4_OP_CUT      = 0x09,
    WINED3D_SM4_OP_DP3      = 0x10,
    WINED3D_SM4_OP_DP4      = 0x11,
    WINED3D_SM4_OP_EMIT     = 0x13,
    WINED3D_SM4_OP_ENDIF    = 0x15,
    WINED3D_SM4_OP_ENDLOOP  = 0x16,
    WINED3D_SM4_OP_EXP      = 0x19,
    WINED3D_SM4_OP_FRC      = 0x1a,
    WINED3D_SM4_OP_IADD     = 0x1e,
    WINED3D_SM4_OP_IF       = 0x1f,
    WINED3D_SM4_OP_IGE      = 0x21,
    WINED3D_SM4_OP_IMUL     = 0x26,
    WINED3D_SM4_OP_LOG      = 0x2f,
    WINED3D_SM4_OP_LOOP     = 0x30,
    WINED3D_SM4_OP_LT       = 0x31,
    WINED3D_SM4_OP_MAD      = 0x32,
    WINED3D_SM4_OP_MIN      = 0x33,
    WINED3D_SM4_OP_MAX      = 0x34,
    WINED3D_SM4_OP_MOV      = 0x36,
    WINED3D_SM4_OP_MOVC     = 0x37,
    WINED3D_SM4_OP_MUL      = 0x38,
    WINED3D_SM4_OP_RET      = 0x3e,
    WINED3D_SM4_OP_RSQ      = 0x44,
    WINED3D_SM4_OP_SINCOS   = 0x4d,
};
80
/*
 * Raw SM4 register type values, as extracted from an operand token with
 * WINED3D_SM4_REGISTER_TYPE_MASK. The values double as indices into
 * register_type_table.
 */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP         = 0x0,
    WINED3D_SM4_RT_INPUT        = 0x1,
    WINED3D_SM4_RT_OUTPUT       = 0x2,
    WINED3D_SM4_RT_IMMCONST     = 0x4,
    WINED3D_SM4_RT_CONSTBUFFER  = 0x8,
    WINED3D_SM4_RT_NULL         = 0xd,
};
90
/*
 * Immediate constant layouts, as extracted from an immediate operand token
 * with WINED3D_SM4_IMMCONST_TYPE_MASK. A scalar is followed by one DWORD of
 * data, a vec4 by four.
 */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_SCALAR = 0x1,
    WINED3D_SM4_IMMCONST_VEC4   = 0x2,
};
96
97 struct wined3d_sm4_data
98 {
99 struct wined3d_shader_version shader_version;
100 const DWORD *end;
101 const struct wined3d_shader_signature *output_signature;
102 };
103
104 struct wined3d_sm4_opcode_info
105 {
106 enum wined3d_sm4_opcode opcode;
107 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
108 UINT dst_count;
109 UINT src_count;
110 };
111
112 struct sysval_map
113 {
114 enum wined3d_sysval_semantic sysval;
115 WINED3DSHADER_PARAM_REGISTER_TYPE register_type;
116 UINT register_idx;
117 };
118
119 static const struct wined3d_sm4_opcode_info opcode_table[] =
120 {
121 {WINED3D_SM4_OP_ADD, WINED3DSIH_ADD, 1, 2},
122 {WINED3D_SM4_OP_AND, WINED3DSIH_AND, 1, 2},
123 {WINED3D_SM4_OP_BREAK, WINED3DSIH_BREAK, 0, 0},
124 {WINED3D_SM4_OP_BREAKC, WINED3DSIH_BREAKP, 0, 1},
125 {WINED3D_SM4_OP_CUT, WINED3DSIH_CUT, 0, 0},
126 {WINED3D_SM4_OP_DP3, WINED3DSIH_DP3, 1, 2},
127 {WINED3D_SM4_OP_DP4, WINED3DSIH_DP4, 1, 2},
128 {WINED3D_SM4_OP_EMIT, WINED3DSIH_EMIT, 0, 0},
129 {WINED3D_SM4_OP_ENDIF, WINED3DSIH_ENDIF, 0, 0},
130 {WINED3D_SM4_OP_ENDLOOP,WINED3DSIH_ENDLOOP, 0, 0},
131 {WINED3D_SM4_OP_EXP, WINED3DSIH_EXP, 1, 1},
132 {WINED3D_SM4_OP_FRC, WINED3DSIH_FRC, 1, 1},
133 {WINED3D_SM4_OP_IADD, WINED3DSIH_IADD, 1, 2},
134 {WINED3D_SM4_OP_IF, WINED3DSIH_IF, 0, 1},
135 {WINED3D_SM4_OP_IGE, WINED3DSIH_IGE, 1, 2},
136 {WINED3D_SM4_OP_IMUL, WINED3DSIH_IMUL, 2, 2},
137 {WINED3D_SM4_OP_LOG, WINED3DSIH_LOG, 1, 1},
138 {WINED3D_SM4_OP_LOOP, WINED3DSIH_LOOP, 0, 0},
139 {WINED3D_SM4_OP_LT, WINED3DSIH_LT, 1, 2},
140 {WINED3D_SM4_OP_MAD, WINED3DSIH_MAD, 1, 3},
141 {WINED3D_SM4_OP_MIN, WINED3DSIH_MIN, 1, 2},
142 {WINED3D_SM4_OP_MAX, WINED3DSIH_MAX, 1, 2},
143 {WINED3D_SM4_OP_MOV, WINED3DSIH_MOV, 1, 1},
144 {WINED3D_SM4_OP_MOVC, WINED3DSIH_MOVC, 1, 3},
145 {WINED3D_SM4_OP_MUL, WINED3DSIH_MUL, 1, 2},
146 {WINED3D_SM4_OP_RET, WINED3DSIH_RET, 0, 0},
147 {WINED3D_SM4_OP_RSQ, WINED3DSIH_RSQ, 1, 1},
148 {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS, 2, 1},
149 };
150
151 static const WINED3DSHADER_PARAM_REGISTER_TYPE register_type_table[] =
152 {
153 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP,
154 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT,
155 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT,
156 /* UNKNOWN */ 0,
157 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST,
158 /* UNKNOWN */ 0,
159 /* UNKNOWN */ 0,
160 /* UNKNOWN */ 0,
161 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER,
162 /* UNKNOWN */ 0,
163 /* UNKNOWN */ 0,
164 /* UNKNOWN */ 0,
165 /* UNKNOWN */ 0,
166 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL,
167 };
168
169 static const struct sysval_map sysval_map[] =
170 {
171 {WINED3D_SV_DEPTH, WINED3DSPR_DEPTHOUT, 0},
172 {WINED3D_SV_TARGET0, WINED3DSPR_COLOROUT, 0},
173 {WINED3D_SV_TARGET1, WINED3DSPR_COLOROUT, 1},
174 {WINED3D_SV_TARGET2, WINED3DSPR_COLOROUT, 2},
175 {WINED3D_SV_TARGET3, WINED3DSPR_COLOROUT, 3},
176 {WINED3D_SV_TARGET4, WINED3DSPR_COLOROUT, 4},
177 {WINED3D_SV_TARGET5, WINED3DSPR_COLOROUT, 5},
178 {WINED3D_SV_TARGET6, WINED3DSPR_COLOROUT, 6},
179 {WINED3D_SV_TARGET7, WINED3DSPR_COLOROUT, 7},
180 };
181
182 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
183 {
184 unsigned int i;
185
186 for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
187 {
188 if (opcode == opcode_table[i].opcode) return &opcode_table[i];
189 }
190
191 return NULL;
192 }
193
194 static void map_sysval(enum wined3d_sysval_semantic sysval, struct wined3d_shader_register *reg)
195 {
196 unsigned int i;
197
198 for (i = 0; i < sizeof(sysval_map) / sizeof(*sysval_map); ++i)
199 {
200 if (sysval == sysval_map[i].sysval)
201 {
202 reg->type = sysval_map[i].register_type;
203 reg->idx = sysval_map[i].register_idx;
204 }
205 }
206 }
207
208 static void map_register(struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
209 {
210 switch (priv->shader_version.type)
211 {
212 case WINED3D_SHADER_TYPE_PIXEL:
213 if (reg->type == WINED3DSPR_OUTPUT)
214 {
215 unsigned int i;
216 const struct wined3d_shader_signature *s = priv->output_signature;
217
218 if (!s)
219 {
220 ERR("Shader has no output signature, unable to map register.\n");
221 break;
222 }
223
224 for (i = 0; i < s->element_count; ++i)
225 {
226 if (s->elements[i].register_idx == reg->idx)
227 {
228 map_sysval(s->elements[i].sysval_semantic, reg);
229 break;
230 }
231 }
232 }
233 break;
234
235 default:
236 break;
237 }
238 }
239
240 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
241 {
242 struct wined3d_sm4_data *priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv));
243 if (!priv)
244 {
245 ERR("Failed to allocate private data\n");
246 return NULL;
247 }
248
249 priv->output_signature = output_signature;
250
251 return priv;
252 }
253
/* Release the private parser state returned by shader_sm4_init(). */
static void shader_sm4_free(void *data)
{
    HeapFree(GetProcessHeap(), 0, data);
}
258
259 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
260 {
261 struct wined3d_sm4_data *priv = data;
262 DWORD version_token;
263
264 priv->end = *ptr;
265
266 version_token = *(*ptr)++;
267 TRACE("version: 0x%08x\n", version_token);
268
269 TRACE("token count: %u\n", **ptr);
270 priv->end += *(*ptr)++;
271
272 switch (version_token >> 16)
273 {
274 case WINED3D_SM4_PS:
275 priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
276 break;
277
278 case WINED3D_SM4_VS:
279 priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
280 break;
281
282 case WINED3D_SM4_GS:
283 priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
284 break;
285
286 default:
287 FIXME("Unrecognized shader type %#x\n", version_token >> 16);
288 }
289 priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
290 priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
291
292 *shader_version = priv->shader_version;
293 }
294
295 static void shader_sm4_read_opcode(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins,
296 UINT *param_size)
297 {
298 const struct wined3d_sm4_opcode_info *opcode_info;
299 DWORD token = *(*ptr)++;
300 DWORD opcode = token & WINED3D_SM4_OPCODE_MASK;
301
302 *param_size = ((token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
303
304 opcode_info = get_opcode_info(opcode);
305 if (!opcode_info)
306 {
307 FIXME("Unrecognized opcode %#x, token 0x%08x\n", opcode, token);
308 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
309 return;
310 }
311
312 ins->handler_idx = opcode_info->handler_idx;
313 ins->flags = 0;
314 ins->coissue = 0;
315 ins->predicate = 0;
316 ins->dst_count = opcode_info->dst_count;
317 ins->src_count = opcode_info->src_count;
318 }
319
320 static void shader_sm4_read_src_param(void *data, const DWORD **ptr, struct wined3d_shader_src_param *src_param,
321 struct wined3d_shader_src_param *src_rel_addr)
322 {
323 struct wined3d_sm4_data *priv = data;
324 DWORD token = *(*ptr)++;
325 enum wined3d_sm4_register_type register_type;
326 DWORD order;
327
328 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
329 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
330 {
331 FIXME("Unhandled register type %#x\n", register_type);
332 src_param->reg.type = WINED3DSPR_TEMP;
333 }
334 else
335 {
336 src_param->reg.type = register_type_table[register_type];
337 }
338
339 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
340
341 if (order < 1) src_param->reg.idx = ~0U;
342 else src_param->reg.idx = *(*ptr)++;
343
344 if (order < 2) src_param->reg.array_idx = ~0U;
345 else src_param->reg.array_idx = *(*ptr)++;
346
347 if (order > 2) FIXME("Unhandled order %u.\n", order);
348
349 if (register_type == WINED3D_SM4_RT_IMMCONST)
350 {
351 enum wined3d_sm4_immconst_type immconst_type =
352 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
353 src_param->swizzle = WINED3DSP_NOSWIZZLE;
354
355 switch(immconst_type)
356 {
357 case WINED3D_SM4_IMMCONST_SCALAR:
358 src_param->reg.immconst_type = WINED3D_IMMCONST_SCALAR;
359 memcpy(src_param->reg.immconst_data, *ptr, 1 * sizeof(DWORD));
360 *ptr += 1;
361 break;
362
363 case WINED3D_SM4_IMMCONST_VEC4:
364 src_param->reg.immconst_type = WINED3D_IMMCONST_VEC4;
365 memcpy(src_param->reg.immconst_data, *ptr, 4 * sizeof(DWORD));
366 *ptr += 4;
367 break;
368
369 default:
370 FIXME("Unhandled immediate constant type %#x\n", immconst_type);
371 break;
372 }
373 }
374 else
375 {
376 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
377 }
378
379 src_param->modifiers = 0;
380 src_param->reg.rel_addr = NULL;
381
382 map_register(priv, &src_param->reg);
383 }
384
385 static void shader_sm4_read_dst_param(void *data, const DWORD **ptr, struct wined3d_shader_dst_param *dst_param,
386 struct wined3d_shader_src_param *dst_rel_addr)
387 {
388 struct wined3d_sm4_data *priv = data;
389 DWORD token = *(*ptr)++;
390 enum wined3d_sm4_register_type register_type;
391 DWORD order;
392
393 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
394 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
395 {
396 FIXME("Unhandled register type %#x\n", register_type);
397 dst_param->reg.type = WINED3DSPR_TEMP;
398 }
399 else
400 {
401 dst_param->reg.type = register_type_table[register_type];
402 }
403
404 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
405
406 if (order < 1) dst_param->reg.idx = ~0U;
407 else dst_param->reg.idx = *(*ptr)++;
408
409 if (order < 2) dst_param->reg.array_idx = ~0U;
410 else dst_param->reg.array_idx = *(*ptr)++;
411
412 if (order > 2) FIXME("Unhandled order %u.\n", order);
413
414 dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
415 dst_param->modifiers = 0;
416 dst_param->shift = 0;
417 dst_param->reg.rel_addr = NULL;
418
419 map_register(priv, &dst_param->reg);
420 }
421
422 static void shader_sm4_read_semantic(const DWORD **ptr, struct wined3d_shader_semantic *semantic)
423 {
424 FIXME("ptr %p, semantic %p stub!\n", ptr, semantic);
425 }
426
427 static void shader_sm4_read_comment(const DWORD **ptr, const char **comment, UINT *comment_size)
428 {
429 FIXME("ptr %p, comment %p, comment_size %p stub!\n", ptr, comment, comment_size);
430 *comment = NULL;
431 }
432
433 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
434 {
435 struct wined3d_sm4_data *priv = data;
436 return *ptr == priv->end;
437 }
438
439 const struct wined3d_shader_frontend sm4_shader_frontend =
440 {
441 shader_sm4_init,
442 shader_sm4_free,
443 shader_sm4_read_header,
444 shader_sm4_read_opcode,
445 shader_sm4_read_src_param,
446 shader_sm4_read_dst_param,
447 shader_sm4_read_semantic,
448 shader_sm4_read_comment,
449 shader_sm4_is_end,
450 };