oledb32/tests: Improve IDataSourceLocator tests a bit.
[wine/multimedia.git] / dlls / wined3d / shader_sm4.c
blob9f8fe12b7f0618e9db52ea402ac084c21524e108
/*
 * Copyright 2009 Henri Verbeet for CodeWeavers
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
 */
19 #include "config.h"
20 #include "wine/port.h"
22 #include "wined3d_private.h"
/* Debug channels used by this file. The d3d_bytecode channel is only used
 * for the raw token dump in shader_sm4_read_instruction(). */
WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode);
/*
 * Bit layout of SM4 tokens. All masks are unsigned so that shifting into
 * bit 31 is well defined and the results combine cleanly with DWORD tokens.
 */

/* Opcode token: set when an instruction modifier token follows. */
#define WINED3D_SM4_INSTRUCTION_MODIFIER        (0x1u << 31)

/* Opcode token: instruction length in tokens, including the opcode token. */
#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0x1fu << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

/* Opcode token of a resource declaration: resource type. */
#define WINED3D_SM4_RESOURCE_TYPE_SHIFT         11
#define WINED3D_SM4_RESOURCE_TYPE_MASK          (0xfu << WINED3D_SM4_RESOURCE_TYPE_SHIFT)

/* Opcode token of an input primitive / output topology declaration. */
#define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT        11
#define WINED3D_SM4_PRIMITIVE_TYPE_MASK         (0x7u << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)

/* Opcode token of a constant buffer declaration: dynamic indexing flag. */
#define WINED3D_SM4_INDEX_TYPE_SHIFT            11
#define WINED3D_SM4_INDEX_TYPE_MASK             (0x1u << WINED3D_SM4_INDEX_TYPE_SHIFT)

/* Opcode token: the opcode itself. */
#define WINED3D_SM4_OPCODE_MASK                 0xff

/* Register token: set when a register modifier token follows. */
#define WINED3D_SM4_REGISTER_MODIFIER           (0x1u << 31)

/* Register token: addressing mode of the second register index. */
#define WINED3D_SM4_ADDRESSING_SHIFT1           25
#define WINED3D_SM4_ADDRESSING_MASK1            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT1)

/* Register token: addressing mode of the first register index. */
#define WINED3D_SM4_ADDRESSING_SHIFT0           22
#define WINED3D_SM4_ADDRESSING_MASK0            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT0)

/* Register token: number of register indices that follow. */
#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3u << WINED3D_SM4_REGISTER_ORDER_SHIFT)

/* Register token: register type (enum wined3d_sm4_register_type). */
#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xfu << WINED3D_SM4_REGISTER_TYPE_SHIFT)

/* Source register token: swizzle type (enum wined3d_sm4_swizzle_type). */
#define WINED3D_SM4_SWIZZLE_TYPE_SHIFT          2
#define WINED3D_SM4_SWIZZLE_TYPE_MASK           (0x3u << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)

/* Immediate constant register token: scalar or vec4. */
#define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
#define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3u << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

/* Destination register token: write mask. */
#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xfu << WINED3D_SM4_WRITEMASK_SHIFT)

/* Source register token: swizzle. */
#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xffu << WINED3D_SM4_SWIZZLE_SHIFT)

/* Version token: major / minor shader model version. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)

/* Flags in the per-index addressing field. */
#define WINED3D_SM4_ADDRESSING_RELATIVE         0x2
#define WINED3D_SM4_ADDRESSING_OFFSET           0x1
/* Opcode values as found in the low 8 bits (WINED3D_SM4_OPCODE_MASK) of an
 * SM4 opcode token. Only the opcodes handled by this parser are listed. */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD                  = 0x00,
    WINED3D_SM4_OP_AND                  = 0x01,
    WINED3D_SM4_OP_BREAK                = 0x02,
    WINED3D_SM4_OP_BREAKC               = 0x03,
    WINED3D_SM4_OP_CUT                  = 0x09,
    WINED3D_SM4_OP_DERIV_RTX            = 0x0b,
    WINED3D_SM4_OP_DERIV_RTY            = 0x0c,
    WINED3D_SM4_OP_DISCARD              = 0x0d,
    WINED3D_SM4_OP_DIV                  = 0x0e,
    WINED3D_SM4_OP_DP2                  = 0x0f,
    WINED3D_SM4_OP_DP3                  = 0x10,
    WINED3D_SM4_OP_DP4                  = 0x11,
    WINED3D_SM4_OP_EMIT                 = 0x13,
    WINED3D_SM4_OP_ENDIF                = 0x15,
    WINED3D_SM4_OP_ENDLOOP              = 0x16,
    WINED3D_SM4_OP_EQ                   = 0x18,
    WINED3D_SM4_OP_EXP                  = 0x19,
    WINED3D_SM4_OP_FRC                  = 0x1a,
    WINED3D_SM4_OP_FTOI                 = 0x1b,
    WINED3D_SM4_OP_GE                   = 0x1d,
    WINED3D_SM4_OP_IADD                 = 0x1e,
    WINED3D_SM4_OP_IF                   = 0x1f,
    WINED3D_SM4_OP_IEQ                  = 0x20,
    WINED3D_SM4_OP_IGE                  = 0x21,
    WINED3D_SM4_OP_IMUL                 = 0x26,
    WINED3D_SM4_OP_ISHL                 = 0x29,
    WINED3D_SM4_OP_ITOF                 = 0x2b,
    WINED3D_SM4_OP_LD                   = 0x2d,
    WINED3D_SM4_OP_LOG                  = 0x2f,
    WINED3D_SM4_OP_LOOP                 = 0x30,
    WINED3D_SM4_OP_LT                   = 0x31,
    WINED3D_SM4_OP_MAD                  = 0x32,
    WINED3D_SM4_OP_MIN                  = 0x33,
    WINED3D_SM4_OP_MAX                  = 0x34,
    WINED3D_SM4_OP_MOV                  = 0x36,
    WINED3D_SM4_OP_MOVC                 = 0x37,
    WINED3D_SM4_OP_MUL                  = 0x38,
    WINED3D_SM4_OP_NE                   = 0x39,
    WINED3D_SM4_OP_OR                   = 0x3c,
    WINED3D_SM4_OP_RET                  = 0x3e,
    WINED3D_SM4_OP_ROUND_NI             = 0x41,
    WINED3D_SM4_OP_RSQ                  = 0x44,
    WINED3D_SM4_OP_SAMPLE               = 0x45,
    WINED3D_SM4_OP_SAMPLE_LOD           = 0x48,
    WINED3D_SM4_OP_SAMPLE_GRAD          = 0x49,
    WINED3D_SM4_OP_SQRT                 = 0x4b,
    WINED3D_SM4_OP_SINCOS               = 0x4d,
    WINED3D_SM4_OP_UDIV                 = 0x4e,
    WINED3D_SM4_OP_UGE                  = 0x50,
    WINED3D_SM4_OP_USHR                 = 0x55,
    WINED3D_SM4_OP_UTOF                 = 0x56,
    WINED3D_SM4_OP_XOR                  = 0x57,
    WINED3D_SM4_OP_DCL_RESOURCE         = 0x58,
    WINED3D_SM4_OP_DCL_CONSTANT_BUFFER  = 0x59,
    WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY  = 0x5c,
    WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE  = 0x5d,
    WINED3D_SM4_OP_DCL_VERTICES_OUT     = 0x5e,
};
/* Register type values stored in the WINED3D_SM4_REGISTER_TYPE_MASK field of
 * a register token; used as index into register_type_table[]. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP         = 0x0,
    WINED3D_SM4_RT_INPUT        = 0x1,
    WINED3D_SM4_RT_OUTPUT       = 0x2,
    WINED3D_SM4_RT_IMMCONST     = 0x4,
    WINED3D_SM4_RT_SAMPLER      = 0x6,
    WINED3D_SM4_RT_RESOURCE     = 0x7,
    WINED3D_SM4_RT_CONSTBUFFER  = 0x8,
    WINED3D_SM4_RT_PRIMID       = 0xb,
    WINED3D_SM4_RT_NULL         = 0xd,
};
/* Primitive type values of an output topology declaration; used as index
 * into output_primitive_type_table[]. */
enum wined3d_sm4_output_primitive_type
{
    WINED3D_SM4_OUTPUT_PT_POINTLIST     = 0x1,
    WINED3D_SM4_OUTPUT_PT_LINELIST      = 0x3,
    WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
};
/* Primitive type values of an input primitive declaration; used as index
 * into input_primitive_type_table[]. */
enum wined3d_sm4_input_primitive_type
{
    WINED3D_SM4_INPUT_PT_POINT          = 0x1,
    WINED3D_SM4_INPUT_PT_LINE           = 0x2,
    WINED3D_SM4_INPUT_PT_TRIANGLE       = 0x3,
    WINED3D_SM4_INPUT_PT_LINEADJ        = 0x6,
    WINED3D_SM4_INPUT_PT_TRIANGLEADJ    = 0x7,
};
/* Values of the WINED3D_SM4_SWIZZLE_TYPE_MASK field of a source register
 * token, see shader_sm4_read_src_param(). */
enum wined3d_sm4_swizzle_type
{
    WINED3D_SM4_SWIZZLE_VEC4    = 0x1,
    WINED3D_SM4_SWIZZLE_SCALAR  = 0x2,
};
/* Values of the WINED3D_SM4_IMMCONST_TYPE_MASK field of an immediate
 * constant register token: one or four DWORDs of data follow. */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_SCALAR = 0x1,
    WINED3D_SM4_IMMCONST_VEC4   = 0x2,
};
/* Resource type values of a resource declaration; used as index into
 * resource_type_table[]. */
enum wined3d_sm4_resource_type
{
    WINED3D_SM4_RESOURCE_BUFFER             = 0x1,
    WINED3D_SM4_RESOURCE_TEXTURE_1D         = 0x2,
    WINED3D_SM4_RESOURCE_TEXTURE_2D         = 0x3,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMS       = 0x4,
    WINED3D_SM4_RESOURCE_TEXTURE_3D         = 0x5,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBE       = 0x6,
    WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY    = 0x7,
    WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY    = 0x8,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY  = 0x9,
};
/* Per-component data type values of a resource declaration; used as index
 * into data_type_table[]. */
enum wined3d_sm4_data_type
{
    WINED3D_SM4_DATA_UNORM  = 0x1,
    WINED3D_SM4_DATA_SNORM  = 0x2,
    WINED3D_SM4_DATA_INT    = 0x3,
    WINED3D_SM4_DATA_UINT   = 0x4,
    WINED3D_SM4_DATA_FLOAT  = 0x5,
};
199 struct wined3d_shader_src_param_entry
201 struct list entry;
202 struct wined3d_shader_src_param param;
205 struct wined3d_sm4_data
207 struct wined3d_shader_version shader_version;
208 const DWORD *end;
210 struct
212 enum wined3d_shader_register_type register_type;
213 UINT register_idx;
214 } output_map[MAX_REG_OUTPUT];
216 struct wined3d_shader_src_param src_param[5];
217 struct wined3d_shader_dst_param dst_param[2];
218 struct list src_free;
219 struct list src;
222 struct wined3d_sm4_opcode_info
224 enum wined3d_sm4_opcode opcode;
225 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
226 const char *dst_info;
227 const char *src_info;
230 struct sysval_map
232 enum wined3d_sysval_semantic sysval;
233 enum wined3d_shader_register_type register_type;
234 UINT register_idx;
238 * F -> WINED3D_DATA_FLOAT
239 * I -> WINED3D_DATA_INT
240 * R -> WINED3D_DATA_RESOURCE
241 * S -> WINED3D_DATA_SAMPLER
242 * U -> WINED3D_DATA_UINT
244 static const struct wined3d_sm4_opcode_info opcode_table[] =
246 {WINED3D_SM4_OP_ADD, WINED3DSIH_ADD, "F", "FF"},
247 {WINED3D_SM4_OP_AND, WINED3DSIH_AND, "U", "UU"},
248 {WINED3D_SM4_OP_BREAK, WINED3DSIH_BREAK, "", ""},
249 {WINED3D_SM4_OP_BREAKC, WINED3DSIH_BREAKP, "", "U"},
250 {WINED3D_SM4_OP_CUT, WINED3DSIH_CUT, "", ""},
251 {WINED3D_SM4_OP_DERIV_RTX, WINED3DSIH_DSX, "F", "F"},
252 {WINED3D_SM4_OP_DERIV_RTY, WINED3DSIH_DSY, "F", "F"},
253 {WINED3D_SM4_OP_DISCARD, WINED3DSIH_TEXKILL, "", "U"},
254 {WINED3D_SM4_OP_DIV, WINED3DSIH_DIV, "F", "FF"},
255 {WINED3D_SM4_OP_DP2, WINED3DSIH_DP2, "F", "FF"},
256 {WINED3D_SM4_OP_DP3, WINED3DSIH_DP3, "F", "FF"},
257 {WINED3D_SM4_OP_DP4, WINED3DSIH_DP4, "F", "FF"},
258 {WINED3D_SM4_OP_EMIT, WINED3DSIH_EMIT, "", ""},
259 {WINED3D_SM4_OP_ENDIF, WINED3DSIH_ENDIF, "", ""},
260 {WINED3D_SM4_OP_ENDLOOP, WINED3DSIH_ENDLOOP, "", ""},
261 {WINED3D_SM4_OP_EQ, WINED3DSIH_EQ, "U", "FF"},
262 {WINED3D_SM4_OP_EXP, WINED3DSIH_EXP, "F", "F"},
263 {WINED3D_SM4_OP_FRC, WINED3DSIH_FRC, "F", "F"},
264 {WINED3D_SM4_OP_FTOI, WINED3DSIH_FTOI, "I", "F"},
265 {WINED3D_SM4_OP_GE, WINED3DSIH_GE, "U", "FF"},
266 {WINED3D_SM4_OP_IADD, WINED3DSIH_IADD, "I", "II"},
267 {WINED3D_SM4_OP_IF, WINED3DSIH_IF, "", "U"},
268 {WINED3D_SM4_OP_IEQ, WINED3DSIH_IEQ, "U", "II"},
269 {WINED3D_SM4_OP_IGE, WINED3DSIH_IGE, "U", "II"},
270 {WINED3D_SM4_OP_IMUL, WINED3DSIH_IMUL, "II", "II"},
271 {WINED3D_SM4_OP_ISHL, WINED3DSIH_ISHL, "I", "II"},
272 {WINED3D_SM4_OP_ITOF, WINED3DSIH_ITOF, "F", "I"},
273 {WINED3D_SM4_OP_LD, WINED3DSIH_LD, "U", "FR"},
274 {WINED3D_SM4_OP_LOG, WINED3DSIH_LOG, "F", "F"},
275 {WINED3D_SM4_OP_LOOP, WINED3DSIH_LOOP, "", ""},
276 {WINED3D_SM4_OP_LT, WINED3DSIH_LT, "U", "FF"},
277 {WINED3D_SM4_OP_MAD, WINED3DSIH_MAD, "F", "FFF"},
278 {WINED3D_SM4_OP_MIN, WINED3DSIH_MIN, "F", "FF"},
279 {WINED3D_SM4_OP_MAX, WINED3DSIH_MAX, "F", "FF"},
280 {WINED3D_SM4_OP_MOV, WINED3DSIH_MOV, "F", "F"},
281 {WINED3D_SM4_OP_MOVC, WINED3DSIH_MOVC, "F", "UFF"},
282 {WINED3D_SM4_OP_MUL, WINED3DSIH_MUL, "F", "FF"},
283 {WINED3D_SM4_OP_NE, WINED3DSIH_NE, "U", "FF"},
284 {WINED3D_SM4_OP_OR, WINED3DSIH_OR, "U", "UU"},
285 {WINED3D_SM4_OP_RET, WINED3DSIH_RET, "", ""},
286 {WINED3D_SM4_OP_ROUND_NI, WINED3DSIH_ROUND_NI, "F", "F"},
287 {WINED3D_SM4_OP_RSQ, WINED3DSIH_RSQ, "F", "F"},
288 {WINED3D_SM4_OP_SAMPLE, WINED3DSIH_SAMPLE, "U", "FRS"},
289 {WINED3D_SM4_OP_SAMPLE_LOD, WINED3DSIH_SAMPLE_LOD, "U", "FRSF"},
290 {WINED3D_SM4_OP_SAMPLE_GRAD, WINED3DSIH_SAMPLE_GRAD, "U", "FRSFF"},
291 {WINED3D_SM4_OP_SQRT, WINED3DSIH_SQRT, "F", "F"},
292 {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS, "FF", "F"},
293 {WINED3D_SM4_OP_UDIV, WINED3DSIH_UDIV, "UU", "UU"},
294 {WINED3D_SM4_OP_UGE, WINED3DSIH_UGE, "U", "UU"},
295 {WINED3D_SM4_OP_USHR, WINED3DSIH_USHR, "U", "UU"},
296 {WINED3D_SM4_OP_UTOF, WINED3DSIH_UTOF, "F", "U"},
297 {WINED3D_SM4_OP_XOR, WINED3DSIH_XOR, "U", "UU"},
298 {WINED3D_SM4_OP_DCL_RESOURCE, WINED3DSIH_DCL, "R", ""},
299 {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER, WINED3DSIH_DCL_CONSTANT_BUFFER, "", ""},
300 {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY, WINED3DSIH_DCL_OUTPUT_TOPOLOGY, "", ""},
301 {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE, WINED3DSIH_DCL_INPUT_PRIMITIVE, "", ""},
302 {WINED3D_SM4_OP_DCL_VERTICES_OUT, WINED3DSIH_DCL_VERTICES_OUT, "", ""},
305 static const enum wined3d_shader_register_type register_type_table[] =
307 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP,
308 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT,
309 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT,
310 /* UNKNOWN */ 0,
311 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST,
312 /* UNKNOWN */ 0,
313 /* WINED3D_SM4_RT_SAMPLER */ WINED3DSPR_SAMPLER,
314 /* WINED3D_SM4_RT_RESOURCE */ WINED3DSPR_RESOURCE,
315 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER,
316 /* UNKNOWN */ 0,
317 /* UNKNOWN */ 0,
318 /* WINED3D_SM4_RT_PRIMID */ WINED3DSPR_PRIMID,
319 /* UNKNOWN */ 0,
320 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL,
323 static const enum wined3d_primitive_type output_primitive_type_table[] =
325 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
326 /* WINED3D_SM4_OUTPUT_PT_POINTLIST */ WINED3D_PT_POINTLIST,
327 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
328 /* WINED3D_SM4_OUTPUT_PT_LINELIST */ WINED3D_PT_LINELIST,
329 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
330 /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ WINED3D_PT_TRIANGLESTRIP,
333 static const enum wined3d_primitive_type input_primitive_type_table[] =
335 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
336 /* WINED3D_SM4_INPUT_PT_POINT */ WINED3D_PT_POINTLIST,
337 /* WINED3D_SM4_INPUT_PT_LINE */ WINED3D_PT_LINELIST,
338 /* WINED3D_SM4_INPUT_PT_TRIANGLE */ WINED3D_PT_TRIANGLELIST,
339 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
340 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
341 /* WINED3D_SM4_INPUT_PT_LINEADJ */ WINED3D_PT_LINELIST_ADJ,
342 /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */ WINED3D_PT_TRIANGLELIST_ADJ,
345 static const struct sysval_map sysval_map[] =
347 {WINED3D_SV_DEPTH, WINED3DSPR_DEPTHOUT, 0},
348 {WINED3D_SV_TARGET0, WINED3DSPR_COLOROUT, 0},
349 {WINED3D_SV_TARGET1, WINED3DSPR_COLOROUT, 1},
350 {WINED3D_SV_TARGET2, WINED3DSPR_COLOROUT, 2},
351 {WINED3D_SV_TARGET3, WINED3DSPR_COLOROUT, 3},
352 {WINED3D_SV_TARGET4, WINED3DSPR_COLOROUT, 4},
353 {WINED3D_SV_TARGET5, WINED3DSPR_COLOROUT, 5},
354 {WINED3D_SV_TARGET6, WINED3DSPR_COLOROUT, 6},
355 {WINED3D_SV_TARGET7, WINED3DSPR_COLOROUT, 7},
358 static const enum wined3d_shader_resource_type resource_type_table[] =
360 /* 0 */ WINED3D_SHADER_RESOURCE_NONE,
361 /* WINED3D_SM4_RESOURCE_BUFFER */ WINED3D_SHADER_RESOURCE_BUFFER,
362 /* WINED3D_SM4_RESOURCE_TEXTURE_1D */ WINED3D_SHADER_RESOURCE_TEXTURE_1D,
363 /* WINED3D_SM4_RESOURCE_TEXTURE_2D */ WINED3D_SHADER_RESOURCE_TEXTURE_2D,
364 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMS */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMS,
365 /* WINED3D_SM4_RESOURCE_TEXTURE_3D */ WINED3D_SHADER_RESOURCE_TEXTURE_3D,
366 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBE */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBE,
367 /* WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_1DARRAY,
368 /* WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DARRAY,
369 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY,
372 static const enum wined3d_data_type data_type_table[] =
374 /* 0 */ WINED3D_DATA_FLOAT,
375 /* WINED3D_SM4_DATA_UNORM */ WINED3D_DATA_UNORM,
376 /* WINED3D_SM4_DATA_SNORM */ WINED3D_DATA_SNORM,
377 /* WINED3D_SM4_DATA_INT */ WINED3D_DATA_INT,
378 /* WINED3D_SM4_DATA_UINT */ WINED3D_DATA_UINT,
379 /* WINED3D_SM4_DATA_FLOAT */ WINED3D_DATA_FLOAT,
382 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
383 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param);
385 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
387 unsigned int i;
389 for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
391 if (opcode == opcode_table[i].opcode) return &opcode_table[i];
394 return NULL;
397 static void map_register(const struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
399 switch (priv->shader_version.type)
401 case WINED3D_SHADER_TYPE_PIXEL:
402 if (reg->type == WINED3DSPR_OUTPUT)
404 unsigned int reg_idx = reg->idx[0].offset;
406 if (reg_idx >= ARRAY_SIZE(priv->output_map))
408 ERR("Invalid output index %u.\n", reg_idx);
409 break;
412 reg->type = priv->output_map[reg_idx].register_type;
413 reg->idx[0].offset = priv->output_map[reg_idx].register_idx;
415 break;
417 default:
418 break;
422 static enum wined3d_data_type map_data_type(char t)
424 switch (t)
426 case 'F':
427 return WINED3D_DATA_FLOAT;
428 case 'I':
429 return WINED3D_DATA_INT;
430 case 'R':
431 return WINED3D_DATA_RESOURCE;
432 case 'S':
433 return WINED3D_DATA_SAMPLER;
434 case 'U':
435 return WINED3D_DATA_UINT;
436 default:
437 ERR("Invalid data type '%c'.\n", t);
438 return WINED3D_DATA_FLOAT;
442 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
444 struct wined3d_sm4_data *priv;
445 unsigned int i, j;
447 if (!(priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv))))
449 ERR("Failed to allocate private data\n");
450 return NULL;
453 memset(priv->output_map, 0xff, sizeof(priv->output_map));
454 for (i = 0; i < output_signature->element_count; ++i)
456 struct wined3d_shader_signature_element *e = &output_signature->elements[i];
458 if (e->register_idx >= ARRAY_SIZE(priv->output_map))
460 WARN("Invalid output index %u.\n", e->register_idx);
461 continue;
464 for (j = 0; j < ARRAY_SIZE(sysval_map); ++j)
466 if (e->sysval_semantic == sysval_map[j].sysval)
468 priv->output_map[e->register_idx].register_type = sysval_map[j].register_type;
469 priv->output_map[e->register_idx].register_idx = sysval_map[j].register_idx;
470 break;
475 list_init(&priv->src_free);
476 list_init(&priv->src);
478 return priv;
481 static void shader_sm4_free(void *data)
483 struct wined3d_shader_src_param_entry *e1, *e2;
484 struct wined3d_sm4_data *priv = data;
486 list_move_head(&priv->src_free, &priv->src);
487 LIST_FOR_EACH_ENTRY_SAFE(e1, e2, &priv->src_free, struct wined3d_shader_src_param_entry, entry)
489 HeapFree(GetProcessHeap(), 0, e1);
491 HeapFree(GetProcessHeap(), 0, priv);
494 static struct wined3d_shader_src_param *get_src_param(struct wined3d_sm4_data *priv)
496 struct wined3d_shader_src_param_entry *e;
497 struct list *elem;
499 if (!list_empty(&priv->src_free))
501 elem = list_head(&priv->src_free);
502 list_remove(elem);
504 else
506 if (!(e = HeapAlloc(GetProcessHeap(), 0, sizeof(*e))))
507 return NULL;
508 elem = &e->entry;
511 list_add_tail(&priv->src, elem);
512 e = LIST_ENTRY(elem, struct wined3d_shader_src_param_entry, entry);
513 return &e->param;
516 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
518 struct wined3d_sm4_data *priv = data;
519 DWORD version_token;
521 priv->end = *ptr;
523 version_token = *(*ptr)++;
524 TRACE("version: 0x%08x\n", version_token);
526 TRACE("token count: %u\n", **ptr);
527 priv->end += *(*ptr)++;
529 switch (version_token >> 16)
531 case WINED3D_SM4_PS:
532 priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
533 break;
535 case WINED3D_SM4_VS:
536 priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
537 break;
539 case WINED3D_SM4_GS:
540 priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
541 break;
543 default:
544 FIXME("Unrecognized shader type %#x\n", version_token >> 16);
546 priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
547 priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
549 *shader_version = priv->shader_version;
552 static BOOL shader_sm4_read_reg_idx(struct wined3d_sm4_data *priv, const DWORD **ptr,
553 DWORD addressing, struct wined3d_shader_register_index *reg_idx)
555 if (addressing & WINED3D_SM4_ADDRESSING_RELATIVE)
557 struct wined3d_shader_src_param *rel_addr = get_src_param(priv);
559 if (!(reg_idx->rel_addr = rel_addr))
561 ERR("Failed to get src param for relative addressing.\n");
562 return FALSE;
565 if (addressing & WINED3D_SM4_ADDRESSING_OFFSET)
566 reg_idx->offset = *(*ptr)++;
567 else
568 reg_idx->offset = 0;
569 shader_sm4_read_src_param(priv, ptr, WINED3D_DATA_INT, rel_addr);
571 else
573 reg_idx->rel_addr = NULL;
574 reg_idx->offset = *(*ptr)++;
577 return TRUE;
580 static BOOL shader_sm4_read_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
581 enum wined3d_data_type data_type, struct wined3d_shader_register *param,
582 enum wined3d_shader_src_modifier *modifier)
584 enum wined3d_sm4_register_type register_type;
585 DWORD token = *(*ptr)++;
586 DWORD order;
588 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
589 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
591 FIXME("Unhandled register type %#x.\n", register_type);
592 param->type = WINED3DSPR_TEMP;
594 else
596 param->type = register_type_table[register_type];
598 param->data_type = data_type;
600 if (token & WINED3D_SM4_REGISTER_MODIFIER)
602 DWORD m = *(*ptr)++;
604 /* FIXME: This will probably break down at some point. The SM4
605 * modifiers look like flags, while wined3d currently has an enum
606 * with possible combinations, e.g. WINED3DSPSM_ABSNEG. */
607 switch (m)
609 case 0x41:
610 *modifier = WINED3DSPSM_NEG;
611 break;
613 case 0x81:
614 *modifier = WINED3DSPSM_ABS;
615 break;
617 default:
618 FIXME("Skipping modifier 0x%08x.\n", m);
619 *modifier = WINED3DSPSM_NONE;
620 break;
623 else
625 *modifier = WINED3DSPSM_NONE;
628 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
630 if (order < 1)
631 param->idx[0].offset = ~0U;
632 else
634 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK0) >> WINED3D_SM4_ADDRESSING_SHIFT0;
635 if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[0])))
637 ERR("Failed to read register index.\n");
638 return FALSE;
642 if (order < 2)
643 param->idx[1].offset = ~0U;
644 else
646 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK1) >> WINED3D_SM4_ADDRESSING_SHIFT1;
647 if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[1])))
649 ERR("Failed to read register index.\n");
650 return FALSE;
654 if (order > 2)
655 FIXME("Unhandled order %u.\n", order);
657 if (register_type == WINED3D_SM4_RT_IMMCONST)
659 enum wined3d_sm4_immconst_type immconst_type =
660 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
662 switch (immconst_type)
664 case WINED3D_SM4_IMMCONST_SCALAR:
665 param->immconst_type = WINED3D_IMMCONST_SCALAR;
666 memcpy(param->immconst_data, *ptr, 1 * sizeof(DWORD));
667 *ptr += 1;
668 break;
670 case WINED3D_SM4_IMMCONST_VEC4:
671 param->immconst_type = WINED3D_IMMCONST_VEC4;
672 memcpy(param->immconst_data, *ptr, 4 * sizeof(DWORD));
673 *ptr += 4;
674 break;
676 default:
677 FIXME("Unhandled immediate constant type %#x.\n", immconst_type);
678 break;
682 map_register(priv, param);
684 return TRUE;
687 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
688 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param)
690 DWORD token = **ptr;
692 if (!shader_sm4_read_param(priv, ptr, data_type, &src_param->reg, &src_param->modifiers))
694 ERR("Failed to read parameter.\n");
695 return FALSE;
698 if (src_param->reg.type == WINED3DSPR_IMMCONST)
700 src_param->swizzle = WINED3DSP_NOSWIZZLE;
702 else
704 enum wined3d_sm4_swizzle_type swizzle_type =
705 (token & WINED3D_SM4_SWIZZLE_TYPE_MASK) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT;
707 switch (swizzle_type)
709 case WINED3D_SM4_SWIZZLE_SCALAR:
710 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
711 src_param->swizzle = (src_param->swizzle & 0x3) * 0x55;
712 break;
714 case WINED3D_SM4_SWIZZLE_VEC4:
715 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
716 break;
718 default:
719 FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
720 break;
724 return TRUE;
727 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
728 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param)
730 enum wined3d_shader_src_modifier modifier;
731 DWORD token = **ptr;
733 if (!shader_sm4_read_param(priv, ptr, data_type, &dst_param->reg, &modifier))
735 ERR("Failed to read parameter.\n");
736 return FALSE;
739 if (modifier != WINED3DSPSM_NONE)
741 ERR("Invalid source modifier %#x on destination register.\n", modifier);
742 return FALSE;
745 dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
746 dst_param->modifiers = 0;
747 dst_param->shift = 0;
749 return TRUE;
752 static void shader_sm4_read_instruction(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins)
754 const struct wined3d_sm4_opcode_info *opcode_info;
755 struct wined3d_sm4_data *priv = data;
756 DWORD opcode_token, opcode;
757 const DWORD *p;
758 UINT i, len;
760 list_move_head(&priv->src_free, &priv->src);
762 opcode_token = *(*ptr)++;
763 opcode = opcode_token & WINED3D_SM4_OPCODE_MASK;
764 len = ((opcode_token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
766 if (TRACE_ON(d3d_bytecode))
768 TRACE_(d3d_bytecode)("[ %08x ", opcode_token);
769 for (i = 0; i < len; ++i)
771 TRACE_(d3d_bytecode)("%08x ", (*ptr)[i]);
773 TRACE_(d3d_bytecode)("]\n");
776 if (!(opcode_info = get_opcode_info(opcode)))
778 FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode, opcode_token);
779 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
780 *ptr += len;
781 return;
784 ins->handler_idx = opcode_info->handler_idx;
785 ins->flags = 0;
786 ins->coissue = 0;
787 ins->predicate = NULL;
788 ins->dst_count = strlen(opcode_info->dst_info);
789 ins->dst = priv->dst_param;
790 ins->src_count = strlen(opcode_info->src_info);
791 ins->src = priv->src_param;
793 p = *ptr;
794 *ptr += len;
796 if (opcode_token & WINED3D_SM4_INSTRUCTION_MODIFIER)
798 DWORD modifier = *p++;
799 FIXME("Skipping modifier 0x%08x.\n", modifier);
802 if (opcode == WINED3D_SM4_OP_DCL_RESOURCE)
804 enum wined3d_sm4_resource_type resource_type;
805 enum wined3d_sm4_data_type data_type;
806 DWORD components;
808 resource_type = (opcode_token & WINED3D_SM4_RESOURCE_TYPE_MASK) >> WINED3D_SM4_RESOURCE_TYPE_SHIFT;
809 if (!resource_type || (resource_type >= ARRAY_SIZE(resource_type_table)))
811 FIXME("Unhandled resource type %#x.\n", resource_type);
812 ins->declaration.semantic.resource_type = WINED3D_SHADER_RESOURCE_NONE;
814 else
816 ins->declaration.semantic.resource_type = resource_type_table[resource_type];
818 shader_sm4_read_dst_param(priv, &p, WINED3D_DATA_RESOURCE, &ins->declaration.semantic.reg);
820 components = *p++;
821 if ((components & 0xfff0) != (components & 0xf) * 0x1110)
822 FIXME("Components (%#x) have different data types.\n", components);
823 data_type = components & 0xf;
825 if (!data_type || (data_type >= ARRAY_SIZE(data_type_table)))
827 FIXME("Unhandled data type %#x.\n", data_type);
828 ins->declaration.semantic.resource_data_type = WINED3D_DATA_FLOAT;
830 else
832 ins->declaration.semantic.resource_data_type = data_type_table[data_type];
835 else if (opcode == WINED3D_SM4_OP_DCL_CONSTANT_BUFFER)
837 shader_sm4_read_src_param(priv, &p, WINED3D_DATA_FLOAT, &ins->declaration.src);
838 if (opcode_token & WINED3D_SM4_INDEX_TYPE_MASK)
839 ins->flags |= WINED3DSI_INDEXED_DYNAMIC;
841 else if (opcode == WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY)
843 enum wined3d_sm4_output_primitive_type primitive_type;
845 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
846 if (primitive_type >= sizeof(output_primitive_type_table) / sizeof(*output_primitive_type_table))
848 FIXME("Unhandled output primitive type %#x.\n", primitive_type);
849 ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
851 else
853 ins->declaration.primitive_type = output_primitive_type_table[primitive_type];
856 else if (opcode == WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE)
858 enum wined3d_sm4_input_primitive_type primitive_type;
860 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
861 if (primitive_type >= sizeof(input_primitive_type_table) / sizeof(*input_primitive_type_table))
863 FIXME("Unhandled input primitive type %#x.\n", primitive_type);
864 ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
866 else
868 ins->declaration.primitive_type = input_primitive_type_table[primitive_type];
871 else if (opcode == WINED3D_SM4_OP_DCL_VERTICES_OUT)
873 ins->declaration.count = *p++;
875 else
877 for (i = 0; i < ins->dst_count; ++i)
879 if (!(shader_sm4_read_dst_param(priv, &p, map_data_type(opcode_info->dst_info[i]), &priv->dst_param[i])))
881 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
882 return;
886 for (i = 0; i < ins->src_count; ++i)
888 if (!(shader_sm4_read_src_param(priv, &p, map_data_type(opcode_info->src_info[i]), &priv->src_param[i])))
890 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
891 return;
897 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
899 struct wined3d_sm4_data *priv = data;
900 return *ptr == priv->end;
903 const struct wined3d_shader_frontend sm4_shader_frontend =
905 shader_sm4_init,
906 shader_sm4_free,
907 shader_sm4_read_header,
908 shader_sm4_read_instruction,
909 shader_sm4_is_end,