d3d8/tests: Add a system memory miptree layout test.
[wine.git] / dlls / wined3d / shader_sm4.c
blob59336265286306176a1857fbe15c3fad329deb2b
/*
 * Copyright 2009 Henri Verbeet for CodeWeavers
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
 */
19 #include "config.h"
20 #include "wine/port.h"
22 #include "wined3d_private.h"
24 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
25 WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode);
/* Bit-field layout constants for SM4/SM5 tokens. Each *_MASK is the field
 * width shifted into position by the matching *_SHIFT. */

#define WINED3D_SM4_INSTRUCTION_MODIFIER        (0x1u << 31)

#define WINED3D_SM4_MODIFIER_AOFFIMMI           0x1
#define WINED3D_SM4_AOFFIMMI_U_SHIFT            9
#define WINED3D_SM4_AOFFIMMI_U_MASK             (0xfu << WINED3D_SM4_AOFFIMMI_U_SHIFT)
#define WINED3D_SM4_AOFFIMMI_V_SHIFT            13
#define WINED3D_SM4_AOFFIMMI_V_MASK             (0xfu << WINED3D_SM4_AOFFIMMI_V_SHIFT)
#define WINED3D_SM4_AOFFIMMI_W_SHIFT            17
#define WINED3D_SM4_AOFFIMMI_W_MASK             (0xfu << WINED3D_SM4_AOFFIMMI_W_SHIFT)

#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0x1fu << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

#define WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT     11
#define WINED3D_SM4_INSTRUCTION_FLAGS_MASK      (0x7u << WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT)

#define WINED3D_SM4_RESOURCE_TYPE_SHIFT         11
#define WINED3D_SM4_RESOURCE_TYPE_MASK          (0xfu << WINED3D_SM4_RESOURCE_TYPE_SHIFT)

#define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT        11
#define WINED3D_SM4_PRIMITIVE_TYPE_MASK         (0x7u << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)

#define WINED3D_SM4_INDEX_TYPE_SHIFT            11
#define WINED3D_SM4_INDEX_TYPE_MASK             (0x1u << WINED3D_SM4_INDEX_TYPE_SHIFT)

#define WINED3D_SM4_SAMPLER_MODE_SHIFT          11
#define WINED3D_SM4_SAMPLER_MODE_MASK           (0xfu << WINED3D_SM4_SAMPLER_MODE_SHIFT)

#define WINED3D_SM4_SHADER_DATA_TYPE_SHIFT      11
#define WINED3D_SM4_SHADER_DATA_TYPE_MASK       (0xfu << WINED3D_SM4_SHADER_DATA_TYPE_SHIFT)

#define WINED3D_SM4_INTERPOLATION_MODE_SHIFT    11
#define WINED3D_SM4_INTERPOLATION_MODE_MASK     (0xfu << WINED3D_SM4_INTERPOLATION_MODE_SHIFT)

#define WINED3D_SM4_GLOBAL_FLAGS_SHIFT          11
#define WINED3D_SM4_GLOBAL_FLAGS_MASK           (0xffu << WINED3D_SM4_GLOBAL_FLAGS_SHIFT)

#define WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT   11
#define WINED3D_SM5_CONTROL_POINT_COUNT_MASK    (0xffu << WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT)

#define WINED3D_SM5_TESSELLATOR_SHIFT           11
#define WINED3D_SM5_TESSELLATOR_MASK            (0xfu << WINED3D_SM5_TESSELLATOR_SHIFT)

#define WINED3D_SM4_OPCODE_MASK                 0xff

#define WINED3D_SM4_REGISTER_MODIFIER           (0x1u << 31)

#define WINED3D_SM4_ADDRESSING_SHIFT1           25
#define WINED3D_SM4_ADDRESSING_MASK1            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT1)

#define WINED3D_SM4_ADDRESSING_SHIFT0           22
#define WINED3D_SM4_ADDRESSING_MASK0            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT0)

#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3u << WINED3D_SM4_REGISTER_ORDER_SHIFT)

#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xffu << WINED3D_SM4_REGISTER_TYPE_SHIFT)

#define WINED3D_SM4_SWIZZLE_TYPE_SHIFT          2
#define WINED3D_SM4_SWIZZLE_TYPE_MASK           (0x3u << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)

#define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
#define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3u << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xfu << WINED3D_SM4_WRITEMASK_SHIFT)

#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xffu << WINED3D_SM4_SWIZZLE_SHIFT)

/* The version value packs the major number in bits 4-7 and the minor number
 * in bits 0-3. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)

#define WINED3D_SM4_ADDRESSING_RELATIVE         0x2
#define WINED3D_SM4_ADDRESSING_OFFSET           0x1

#define WINED3D_SM4_INSTRUCTION_FLAG_SATURATE   0x4
/* Opcode values as they appear in the low bits of an SM4/SM5 opcode token
 * (see WINED3D_SM4_OPCODE_MASK). Only the opcodes listed here are known to
 * this file; the numbering has gaps. */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD                              = 0x00,
    WINED3D_SM4_OP_AND                              = 0x01,
    WINED3D_SM4_OP_BREAK                            = 0x02,
    WINED3D_SM4_OP_BREAKC                           = 0x03,
    WINED3D_SM4_OP_CUT                              = 0x09,
    WINED3D_SM4_OP_DERIV_RTX                        = 0x0b,
    WINED3D_SM4_OP_DERIV_RTY                        = 0x0c,
    WINED3D_SM4_OP_DISCARD                          = 0x0d,
    WINED3D_SM4_OP_DIV                              = 0x0e,
    WINED3D_SM4_OP_DP2                              = 0x0f,
    WINED3D_SM4_OP_DP3                              = 0x10,
    WINED3D_SM4_OP_DP4                              = 0x11,
    WINED3D_SM4_OP_ELSE                             = 0x12,
    WINED3D_SM4_OP_EMIT                             = 0x13,
    WINED3D_SM4_OP_ENDIF                            = 0x15,
    WINED3D_SM4_OP_ENDLOOP                          = 0x16,
    WINED3D_SM4_OP_EQ                               = 0x18,
    WINED3D_SM4_OP_EXP                              = 0x19,
    WINED3D_SM4_OP_FRC                              = 0x1a,
    WINED3D_SM4_OP_FTOI                             = 0x1b,
    WINED3D_SM4_OP_FTOU                             = 0x1c,
    WINED3D_SM4_OP_GE                               = 0x1d,
    WINED3D_SM4_OP_IADD                             = 0x1e,
    WINED3D_SM4_OP_IF                               = 0x1f,
    WINED3D_SM4_OP_IEQ                              = 0x20,
    WINED3D_SM4_OP_IGE                              = 0x21,
    WINED3D_SM4_OP_ILT                              = 0x22,
    WINED3D_SM4_OP_IMAD                             = 0x23,
    WINED3D_SM4_OP_IMAX                             = 0x24,
    WINED3D_SM4_OP_IMIN                             = 0x25,
    WINED3D_SM4_OP_IMUL                             = 0x26,
    WINED3D_SM4_OP_INE                              = 0x27,
    WINED3D_SM4_OP_INEG                             = 0x28,
    WINED3D_SM4_OP_ISHL                             = 0x29,
    WINED3D_SM4_OP_ITOF                             = 0x2b,
    WINED3D_SM4_OP_LD                               = 0x2d,
    WINED3D_SM4_OP_LD2DMS                           = 0x2e,
    WINED3D_SM4_OP_LOG                              = 0x2f,
    WINED3D_SM4_OP_LOOP                             = 0x30,
    WINED3D_SM4_OP_LT                               = 0x31,
    WINED3D_SM4_OP_MAD                              = 0x32,
    WINED3D_SM4_OP_MIN                              = 0x33,
    WINED3D_SM4_OP_MAX                              = 0x34,
    WINED3D_SM4_OP_SHADER_DATA                      = 0x35,
    WINED3D_SM4_OP_MOV                              = 0x36,
    WINED3D_SM4_OP_MOVC                             = 0x37,
    WINED3D_SM4_OP_MUL                              = 0x38,
    WINED3D_SM4_OP_NE                               = 0x39,
    WINED3D_SM4_OP_NOT                              = 0x3b,
    WINED3D_SM4_OP_OR                               = 0x3c,
    WINED3D_SM4_OP_RESINFO                          = 0x3d,
    WINED3D_SM4_OP_RET                              = 0x3e,
    WINED3D_SM4_OP_ROUND_NI                         = 0x41,
    WINED3D_SM4_OP_ROUND_PI                         = 0x42,
    WINED3D_SM4_OP_ROUND_Z                          = 0x43,
    WINED3D_SM4_OP_RSQ                              = 0x44,
    WINED3D_SM4_OP_SAMPLE                           = 0x45,
    WINED3D_SM4_OP_SAMPLE_C                         = 0x46,
    WINED3D_SM4_OP_SAMPLE_C_LZ                      = 0x47,
    WINED3D_SM4_OP_SAMPLE_LOD                       = 0x48,
    WINED3D_SM4_OP_SAMPLE_GRAD                      = 0x49,
    WINED3D_SM4_OP_SAMPLE_B                         = 0x4a,
    WINED3D_SM4_OP_SQRT                             = 0x4b,
    WINED3D_SM4_OP_SINCOS                           = 0x4d,
    WINED3D_SM4_OP_UDIV                             = 0x4e,
    WINED3D_SM4_OP_ULT                              = 0x4f,
    WINED3D_SM4_OP_UGE                              = 0x50,
    WINED3D_SM4_OP_USHR                             = 0x55,
    WINED3D_SM4_OP_UTOF                             = 0x56,
    WINED3D_SM4_OP_XOR                              = 0x57,
    WINED3D_SM4_OP_DCL_RESOURCE                     = 0x58,
    WINED3D_SM4_OP_DCL_CONSTANT_BUFFER              = 0x59,
    WINED3D_SM4_OP_DCL_SAMPLER                      = 0x5a,
    WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY              = 0x5c,
    WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE              = 0x5d,
    WINED3D_SM4_OP_DCL_VERTICES_OUT                 = 0x5e,
    WINED3D_SM4_OP_DCL_INPUT                        = 0x5f,
    WINED3D_SM4_OP_DCL_INPUT_SGV                    = 0x60,
    WINED3D_SM4_OP_DCL_INPUT_SIV                    = 0x61,
    WINED3D_SM4_OP_DCL_INPUT_PS                     = 0x62,
    WINED3D_SM4_OP_DCL_INPUT_PS_SGV                 = 0x63,
    WINED3D_SM4_OP_DCL_INPUT_PS_SIV                 = 0x64,
    WINED3D_SM4_OP_DCL_OUTPUT                       = 0x65,
    WINED3D_SM4_OP_DCL_OUTPUT_SIV                   = 0x67,
    WINED3D_SM4_OP_DCL_TEMPS                        = 0x68,
    WINED3D_SM4_OP_DCL_GLOBAL_FLAGS                 = 0x6a,
    WINED3D_SM5_OP_HS_DECLS                         = 0x71,
    WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE           = 0x72,
    WINED3D_SM5_OP_HS_FORK_PHASE                    = 0x73,
    WINED3D_SM5_OP_HS_JOIN_PHASE                    = 0x74,
    WINED3D_SM5_OP_DERIV_RTX_COARSE                 = 0x7a,
    WINED3D_SM5_OP_DERIV_RTX_FINE                   = 0x7b,
    WINED3D_SM5_OP_DERIV_RTY_COARSE                 = 0x7c,
    WINED3D_SM5_OP_DERIV_RTY_FINE                   = 0x7d,
    WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT    = 0x93,
    WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT   = 0x94,
    WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN           = 0x95,
    WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING     = 0x96,
    WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE = 0x97,
    WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR            = 0x98,
    WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT = 0x99,
    WINED3D_SM5_OP_DCL_UAV_TYPED                    = 0x9c,
    WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED          = 0xa2,
    WINED3D_SM5_OP_STORE_UAV_TYPED                  = 0xa4,
    WINED3D_SM5_OP_LD_STRUCTURED                    = 0xa7,
};
/* Register type values as encoded in the WINED3D_SM4_REGISTER_TYPE_MASK
 * field of an operand token. These values are also the indices of
 * register_type_table[]. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP                    = 0x0,
    WINED3D_SM4_RT_INPUT                   = 0x1,
    WINED3D_SM4_RT_OUTPUT                  = 0x2,
    WINED3D_SM4_RT_IMMCONST                = 0x4,
    WINED3D_SM4_RT_SAMPLER                 = 0x6,
    WINED3D_SM4_RT_RESOURCE                = 0x7,
    WINED3D_SM4_RT_CONSTBUFFER             = 0x8,
    WINED3D_SM4_RT_IMMCONSTBUFFER          = 0x9,
    WINED3D_SM4_RT_PRIMID                  = 0xb,
    WINED3D_SM4_RT_DEPTHOUT                = 0xc,
    WINED3D_SM4_RT_NULL                    = 0xd,
    WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID = 0x16,
    WINED3D_SM5_RT_FORK_INSTANCE_ID        = 0x17,
    WINED3D_SM5_RT_INPUT_CONTROL_POINT     = 0x19,
    WINED3D_SM5_RT_PATCH_CONSTANT_DATA     = 0x1b,
    WINED3D_SM5_RT_DOMAIN_LOCATION         = 0x1c,
    WINED3D_SM5_RT_UAV                     = 0x1e,
};
/* Output primitive type values; these index output_primitive_type_table[]. */
enum wined3d_sm4_output_primitive_type
{
    WINED3D_SM4_OUTPUT_PT_POINTLIST     = 0x1,
    WINED3D_SM4_OUTPUT_PT_LINELIST      = 0x3,
    WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
};
/* Input primitive type values; these index input_primitive_type_table[]. */
enum wined3d_sm4_input_primitive_type
{
    WINED3D_SM4_INPUT_PT_POINT       = 0x1,
    WINED3D_SM4_INPUT_PT_LINE        = 0x2,
    WINED3D_SM4_INPUT_PT_TRIANGLE    = 0x3,
    WINED3D_SM4_INPUT_PT_LINEADJ     = 0x6,
    WINED3D_SM4_INPUT_PT_TRIANGLEADJ = 0x7,
};
/* Values of the WINED3D_SM4_SWIZZLE_TYPE_MASK field of an operand token. */
enum wined3d_sm4_swizzle_type
{
    WINED3D_SM4_SWIZZLE_NONE   = 0x0,
    WINED3D_SM4_SWIZZLE_VEC4   = 0x1,
    WINED3D_SM4_SWIZZLE_SCALAR = 0x2,
};
/* Values of the WINED3D_SM4_IMMCONST_TYPE_MASK field of an operand token. */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_SCALAR = 0x1,
    WINED3D_SM4_IMMCONST_VEC4   = 0x2,
};
/* Resource type values from the WINED3D_SM4_RESOURCE_TYPE_MASK field of a
 * resource declaration; these index resource_type_table[]. */
enum wined3d_sm4_resource_type
{
    WINED3D_SM4_RESOURCE_BUFFER            = 0x1,
    WINED3D_SM4_RESOURCE_TEXTURE_1D        = 0x2,
    WINED3D_SM4_RESOURCE_TEXTURE_2D        = 0x3,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMS      = 0x4,
    WINED3D_SM4_RESOURCE_TEXTURE_3D        = 0x5,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBE      = 0x6,
    WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY   = 0x7,
    WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY   = 0x8,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY = 0x9,
};
/* Resource component data type values; these index data_type_table[]. */
enum wined3d_sm4_data_type
{
    WINED3D_SM4_DATA_UNORM = 0x1,
    WINED3D_SM4_DATA_SNORM = 0x2,
    WINED3D_SM4_DATA_INT   = 0x3,
    WINED3D_SM4_DATA_UINT  = 0x4,
    WINED3D_SM4_DATA_FLOAT = 0x5,
};
/* Values of the WINED3D_SM4_SAMPLER_MODE_MASK field of a sampler
 * declaration. */
enum wined3d_sm4_sampler_mode
{
    WINED3D_SM4_SAMPLER_DEFAULT    = 0x0,
    WINED3D_SM4_SAMPLER_COMPARISON = 0x1,
};
/* Values of the WINED3D_SM4_SHADER_DATA_TYPE_MASK field of a
 * WINED3D_SM4_OP_SHADER_DATA token. */
enum wined3d_sm4_shader_data_type
{
    WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER = 0x3,
    WINED3D_SM4_SHADER_DATA_MESSAGE                   = 0x4,
};
299 struct wined3d_shader_src_param_entry
301 struct list entry;
302 struct wined3d_shader_src_param param;
305 struct wined3d_sm4_data
307 struct wined3d_shader_version shader_version;
308 const DWORD *end;
310 unsigned int output_map[MAX_REG_OUTPUT];
312 struct wined3d_shader_src_param src_param[5];
313 struct wined3d_shader_dst_param dst_param[2];
314 struct list src_free;
315 struct list src;
316 struct wined3d_shader_immediate_constant_buffer icb;
319 struct wined3d_sm4_opcode_info
321 enum wined3d_sm4_opcode opcode;
322 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
323 const char *dst_info;
324 const char *src_info;
325 void (*read_opcode_func)(struct wined3d_shader_instruction *ins,
326 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
327 struct wined3d_sm4_data *priv);
330 static const enum wined3d_primitive_type output_primitive_type_table[] =
332 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
333 /* WINED3D_SM4_OUTPUT_PT_POINTLIST */ WINED3D_PT_POINTLIST,
334 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
335 /* WINED3D_SM4_OUTPUT_PT_LINELIST */ WINED3D_PT_LINELIST,
336 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
337 /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ WINED3D_PT_TRIANGLESTRIP,
340 static const enum wined3d_primitive_type input_primitive_type_table[] =
342 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
343 /* WINED3D_SM4_INPUT_PT_POINT */ WINED3D_PT_POINTLIST,
344 /* WINED3D_SM4_INPUT_PT_LINE */ WINED3D_PT_LINELIST,
345 /* WINED3D_SM4_INPUT_PT_TRIANGLE */ WINED3D_PT_TRIANGLELIST,
346 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
347 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
348 /* WINED3D_SM4_INPUT_PT_LINEADJ */ WINED3D_PT_LINELIST_ADJ,
349 /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */ WINED3D_PT_TRIANGLELIST_ADJ,
352 static const enum wined3d_shader_resource_type resource_type_table[] =
354 /* 0 */ WINED3D_SHADER_RESOURCE_NONE,
355 /* WINED3D_SM4_RESOURCE_BUFFER */ WINED3D_SHADER_RESOURCE_BUFFER,
356 /* WINED3D_SM4_RESOURCE_TEXTURE_1D */ WINED3D_SHADER_RESOURCE_TEXTURE_1D,
357 /* WINED3D_SM4_RESOURCE_TEXTURE_2D */ WINED3D_SHADER_RESOURCE_TEXTURE_2D,
358 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMS */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMS,
359 /* WINED3D_SM4_RESOURCE_TEXTURE_3D */ WINED3D_SHADER_RESOURCE_TEXTURE_3D,
360 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBE */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBE,
361 /* WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_1DARRAY,
362 /* WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DARRAY,
363 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY,
366 static const enum wined3d_data_type data_type_table[] =
368 /* 0 */ WINED3D_DATA_FLOAT,
369 /* WINED3D_SM4_DATA_UNORM */ WINED3D_DATA_UNORM,
370 /* WINED3D_SM4_DATA_SNORM */ WINED3D_DATA_SNORM,
371 /* WINED3D_SM4_DATA_INT */ WINED3D_DATA_INT,
372 /* WINED3D_SM4_DATA_UINT */ WINED3D_DATA_UINT,
373 /* WINED3D_SM4_DATA_FLOAT */ WINED3D_DATA_FLOAT,
376 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
377 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param);
378 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
379 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param);
381 static void shader_sm4_read_shader_data(struct wined3d_shader_instruction *ins,
382 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
383 struct wined3d_sm4_data *priv)
385 enum wined3d_sm4_shader_data_type type;
386 unsigned int icb_size;
388 type = (opcode_token & WINED3D_SM4_SHADER_DATA_TYPE_MASK) >> WINED3D_SM4_SHADER_DATA_TYPE_SHIFT;
389 if (type != WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER)
391 FIXME("Unhandled shader data type %#x.\n", type);
392 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
393 return;
396 ++tokens;
397 icb_size = token_count - 1;
398 if (icb_size % 4 || icb_size > MAX_IMMEDIATE_CONSTANT_BUFFER_SIZE)
400 FIXME("Unexpected immediate constant buffer size %u.\n", icb_size);
401 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
402 return;
405 priv->icb.element_count = icb_size;
406 memcpy(priv->icb.data, tokens, sizeof(*tokens) * icb_size);
407 ins->declaration.icb = &priv->icb;
410 static void shader_sm4_read_dcl_resource(struct wined3d_shader_instruction *ins,
411 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
412 struct wined3d_sm4_data *priv)
414 enum wined3d_sm4_resource_type resource_type;
415 enum wined3d_sm4_data_type data_type;
416 enum wined3d_data_type reg_data_type;
417 DWORD components;
419 resource_type = (opcode_token & WINED3D_SM4_RESOURCE_TYPE_MASK) >> WINED3D_SM4_RESOURCE_TYPE_SHIFT;
420 if (!resource_type || (resource_type >= ARRAY_SIZE(resource_type_table)))
422 FIXME("Unhandled resource type %#x.\n", resource_type);
423 ins->declaration.semantic.resource_type = WINED3D_SHADER_RESOURCE_NONE;
425 else
427 ins->declaration.semantic.resource_type = resource_type_table[resource_type];
429 reg_data_type = opcode == WINED3D_SM4_OP_DCL_RESOURCE ? WINED3D_DATA_RESOURCE : WINED3D_DATA_UAV;
430 shader_sm4_read_dst_param(priv, &tokens, reg_data_type, &ins->declaration.semantic.reg);
432 components = *tokens++;
433 if ((components & 0xfff0) != (components & 0xf) * 0x1110)
434 FIXME("Components (%#x) have different data types.\n", components);
435 data_type = components & 0xf;
437 if (!data_type || (data_type >= ARRAY_SIZE(data_type_table)))
439 FIXME("Unhandled data type %#x.\n", data_type);
440 ins->declaration.semantic.resource_data_type = WINED3D_DATA_FLOAT;
442 else
444 ins->declaration.semantic.resource_data_type = data_type_table[data_type];
448 static void shader_sm4_read_dcl_constant_buffer(struct wined3d_shader_instruction *ins,
449 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
450 struct wined3d_sm4_data *priv)
452 shader_sm4_read_src_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.src);
453 if (opcode_token & WINED3D_SM4_INDEX_TYPE_MASK)
454 ins->flags |= WINED3DSI_INDEXED_DYNAMIC;
457 static void shader_sm4_read_dcl_sampler(struct wined3d_shader_instruction *ins,
458 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
459 struct wined3d_sm4_data *priv)
461 ins->flags = (opcode_token & WINED3D_SM4_SAMPLER_MODE_MASK) >> WINED3D_SM4_SAMPLER_MODE_SHIFT;
462 if (ins->flags & ~WINED3D_SM4_SAMPLER_COMPARISON)
463 FIXME("Unhandled sampler mode %#x.\n", ins->flags);
464 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_SAMPLER, &ins->declaration.dst);
467 static void shader_sm4_read_dcl_output_topology(struct wined3d_shader_instruction *ins,
468 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
469 struct wined3d_sm4_data *priv)
471 enum wined3d_sm4_output_primitive_type primitive_type;
473 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
474 if (primitive_type >= sizeof(output_primitive_type_table) / sizeof(*output_primitive_type_table))
476 FIXME("Unhandled output primitive type %#x.\n", primitive_type);
477 ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
479 else
481 ins->declaration.primitive_type = output_primitive_type_table[primitive_type];
485 static void shader_sm4_read_dcl_input_primitive(struct wined3d_shader_instruction *ins,
486 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
487 struct wined3d_sm4_data *priv)
489 enum wined3d_sm4_input_primitive_type primitive_type;
491 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
492 if (primitive_type >= sizeof(input_primitive_type_table) / sizeof(*input_primitive_type_table))
494 FIXME("Unhandled input primitive type %#x.\n", primitive_type);
495 ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
497 else
499 ins->declaration.primitive_type = input_primitive_type_table[primitive_type];
503 static void shader_sm4_read_declaration_count(struct wined3d_shader_instruction *ins,
504 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
505 struct wined3d_sm4_data *priv)
507 ins->declaration.count = *tokens;
510 static void shader_sm4_read_declaration_dst(struct wined3d_shader_instruction *ins,
511 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
512 struct wined3d_sm4_data *priv)
514 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.dst);
517 static void shader_sm4_read_declaration_register_semantic(struct wined3d_shader_instruction *ins,
518 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
519 struct wined3d_sm4_data *priv)
521 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.register_semantic.reg);
522 ins->declaration.register_semantic.sysval_semantic = *tokens;
525 static void shader_sm4_read_dcl_input_ps(struct wined3d_shader_instruction *ins,
526 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
527 struct wined3d_sm4_data *priv)
529 ins->flags = (opcode_token & WINED3D_SM4_INTERPOLATION_MODE_MASK) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT;
530 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.dst);
533 static void shader_sm4_read_dcl_input_ps_siv(struct wined3d_shader_instruction *ins,
534 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
535 struct wined3d_sm4_data *priv)
537 ins->flags = (opcode_token & WINED3D_SM4_INTERPOLATION_MODE_MASK) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT;
538 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.register_semantic.reg);
539 ins->declaration.register_semantic.sysval_semantic = *tokens;
542 static void shader_sm4_read_dcl_global_flags(struct wined3d_shader_instruction *ins,
543 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
544 struct wined3d_sm4_data *priv)
546 ins->flags = (opcode_token & WINED3D_SM4_GLOBAL_FLAGS_MASK) >> WINED3D_SM4_GLOBAL_FLAGS_SHIFT;
549 static void shader_sm5_read_control_point_count(struct wined3d_shader_instruction *ins,
550 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
551 struct wined3d_sm4_data *priv)
553 ins->declaration.count = (opcode_token & WINED3D_SM5_CONTROL_POINT_COUNT_MASK)
554 >> WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT;
557 static void shader_sm5_read_dcl_tessellator_domain(struct wined3d_shader_instruction *ins,
558 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
559 struct wined3d_sm4_data *priv)
561 ins->declaration.tessellator_domain = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
562 >> WINED3D_SM5_TESSELLATOR_SHIFT;
565 static void shader_sm5_read_dcl_tessellator_partitioning(struct wined3d_shader_instruction *ins,
566 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
567 struct wined3d_sm4_data *priv)
569 ins->declaration.tessellator_partitioning = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
570 >> WINED3D_SM5_TESSELLATOR_SHIFT;
573 static void shader_sm5_read_dcl_tessellator_output_primitive(struct wined3d_shader_instruction *ins,
574 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
575 struct wined3d_sm4_data *priv)
577 ins->declaration.tessellator_output_primitive = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
578 >> WINED3D_SM5_TESSELLATOR_SHIFT;
581 static void shader_sm5_read_dcl_hs_max_tessfactor(struct wined3d_shader_instruction *ins,
582 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
583 struct wined3d_sm4_data *priv)
585 ins->declaration.max_tessellation_factor = *(float *)tokens;
588 static void shader_sm5_read_dcl_resource_structured(struct wined3d_shader_instruction *ins,
589 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
590 struct wined3d_sm4_data *priv)
592 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_RESOURCE, &ins->declaration.structured_resource.reg);
593 ins->declaration.structured_resource.byte_stride = *tokens;
/*
 * f -> WINED3D_DATA_FLOAT
 * i -> WINED3D_DATA_INT
 * u -> WINED3D_DATA_UINT
 * R -> WINED3D_DATA_RESOURCE
 * S -> WINED3D_DATA_SAMPLER
 * U -> WINED3D_DATA_UAV
 */
604 static const struct wined3d_sm4_opcode_info opcode_table[] =
606 {WINED3D_SM4_OP_ADD, WINED3DSIH_ADD, "f", "ff"},
607 {WINED3D_SM4_OP_AND, WINED3DSIH_AND, "u", "uu"},
608 {WINED3D_SM4_OP_BREAK, WINED3DSIH_BREAK, "", ""},
609 {WINED3D_SM4_OP_BREAKC, WINED3DSIH_BREAKP, "", "u"},
610 {WINED3D_SM4_OP_CUT, WINED3DSIH_CUT, "", ""},
611 {WINED3D_SM4_OP_DERIV_RTX, WINED3DSIH_DSX, "f", "f"},
612 {WINED3D_SM4_OP_DERIV_RTY, WINED3DSIH_DSY, "f", "f"},
613 {WINED3D_SM4_OP_DISCARD, WINED3DSIH_TEXKILL, "", "u"},
614 {WINED3D_SM4_OP_DIV, WINED3DSIH_DIV, "f", "ff"},
615 {WINED3D_SM4_OP_DP2, WINED3DSIH_DP2, "f", "ff"},
616 {WINED3D_SM4_OP_DP3, WINED3DSIH_DP3, "f", "ff"},
617 {WINED3D_SM4_OP_DP4, WINED3DSIH_DP4, "f", "ff"},
618 {WINED3D_SM4_OP_ELSE, WINED3DSIH_ELSE, "", ""},
619 {WINED3D_SM4_OP_EMIT, WINED3DSIH_EMIT, "", ""},
620 {WINED3D_SM4_OP_ENDIF, WINED3DSIH_ENDIF, "", ""},
621 {WINED3D_SM4_OP_ENDLOOP, WINED3DSIH_ENDLOOP, "", ""},
622 {WINED3D_SM4_OP_EQ, WINED3DSIH_EQ, "u", "ff"},
623 {WINED3D_SM4_OP_EXP, WINED3DSIH_EXP, "f", "f"},
624 {WINED3D_SM4_OP_FRC, WINED3DSIH_FRC, "f", "f"},
625 {WINED3D_SM4_OP_FTOI, WINED3DSIH_FTOI, "i", "f"},
626 {WINED3D_SM4_OP_FTOU, WINED3DSIH_FTOU, "u", "f"},
627 {WINED3D_SM4_OP_GE, WINED3DSIH_GE, "u", "ff"},
628 {WINED3D_SM4_OP_IADD, WINED3DSIH_IADD, "i", "ii"},
629 {WINED3D_SM4_OP_IF, WINED3DSIH_IF, "", "u"},
630 {WINED3D_SM4_OP_IEQ, WINED3DSIH_IEQ, "u", "ii"},
631 {WINED3D_SM4_OP_IGE, WINED3DSIH_IGE, "u", "ii"},
632 {WINED3D_SM4_OP_ILT, WINED3DSIH_ILT, "u", "ii"},
633 {WINED3D_SM4_OP_IMAD, WINED3DSIH_IMAD, "i", "iii"},
634 {WINED3D_SM4_OP_IMAX, WINED3DSIH_IMAX, "i", "ii"},
635 {WINED3D_SM4_OP_IMIN, WINED3DSIH_IMIN, "i", "ii"},
636 {WINED3D_SM4_OP_IMUL, WINED3DSIH_IMUL, "ii", "ii"},
637 {WINED3D_SM4_OP_INE, WINED3DSIH_INE, "u", "ii"},
638 {WINED3D_SM4_OP_INEG, WINED3DSIH_INEG, "i", "i"},
639 {WINED3D_SM4_OP_ISHL, WINED3DSIH_ISHL, "i", "ii"},
640 {WINED3D_SM4_OP_ITOF, WINED3DSIH_ITOF, "f", "i"},
641 {WINED3D_SM4_OP_LD, WINED3DSIH_LD, "u", "iR"},
642 {WINED3D_SM4_OP_LD2DMS, WINED3DSIH_LD2DMS, "u", "iRi"},
643 {WINED3D_SM4_OP_LOG, WINED3DSIH_LOG, "f", "f"},
644 {WINED3D_SM4_OP_LOOP, WINED3DSIH_LOOP, "", ""},
645 {WINED3D_SM4_OP_LT, WINED3DSIH_LT, "u", "ff"},
646 {WINED3D_SM4_OP_MAD, WINED3DSIH_MAD, "f", "fff"},
647 {WINED3D_SM4_OP_MIN, WINED3DSIH_MIN, "f", "ff"},
648 {WINED3D_SM4_OP_MAX, WINED3DSIH_MAX, "f", "ff"},
649 {WINED3D_SM4_OP_SHADER_DATA, WINED3DSIH_DCL_IMMEDIATE_CONSTANT_BUFFER, "", "",
650 shader_sm4_read_shader_data},
651 {WINED3D_SM4_OP_MOV, WINED3DSIH_MOV, "f", "f"},
652 {WINED3D_SM4_OP_MOVC, WINED3DSIH_MOVC, "f", "uff"},
653 {WINED3D_SM4_OP_MUL, WINED3DSIH_MUL, "f", "ff"},
654 {WINED3D_SM4_OP_NE, WINED3DSIH_NE, "u", "ff"},
655 {WINED3D_SM4_OP_NOT, WINED3DSIH_NOT, "u", "u"},
656 {WINED3D_SM4_OP_OR, WINED3DSIH_OR, "u", "uu"},
657 {WINED3D_SM4_OP_RESINFO, WINED3DSIH_RESINFO, "f", "iR"},
658 {WINED3D_SM4_OP_RET, WINED3DSIH_RET, "", ""},
659 {WINED3D_SM4_OP_ROUND_NI, WINED3DSIH_ROUND_NI, "f", "f"},
660 {WINED3D_SM4_OP_ROUND_PI, WINED3DSIH_ROUND_PI, "f", "f"},
661 {WINED3D_SM4_OP_ROUND_Z, WINED3DSIH_ROUND_Z, "f", "f"},
662 {WINED3D_SM4_OP_RSQ, WINED3DSIH_RSQ, "f", "f"},
663 {WINED3D_SM4_OP_SAMPLE, WINED3DSIH_SAMPLE, "u", "fRS"},
664 {WINED3D_SM4_OP_SAMPLE_C, WINED3DSIH_SAMPLE_C, "f", "fRSf"},
665 {WINED3D_SM4_OP_SAMPLE_C_LZ, WINED3DSIH_SAMPLE_C_LZ, "f", "fRSf"},
666 {WINED3D_SM4_OP_SAMPLE_LOD, WINED3DSIH_SAMPLE_LOD, "u", "fRSf"},
667 {WINED3D_SM4_OP_SAMPLE_GRAD, WINED3DSIH_SAMPLE_GRAD, "u", "fRSff"},
668 {WINED3D_SM4_OP_SAMPLE_B, WINED3DSIH_SAMPLE_B, "u", "fRSf"},
669 {WINED3D_SM4_OP_SQRT, WINED3DSIH_SQRT, "f", "f"},
670 {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS, "ff", "f"},
671 {WINED3D_SM4_OP_UDIV, WINED3DSIH_UDIV, "uu", "uu"},
672 {WINED3D_SM4_OP_ULT, WINED3DSIH_ULT, "u", "uu"},
673 {WINED3D_SM4_OP_UGE, WINED3DSIH_UGE, "u", "uu"},
674 {WINED3D_SM4_OP_USHR, WINED3DSIH_USHR, "u", "uu"},
675 {WINED3D_SM4_OP_UTOF, WINED3DSIH_UTOF, "f", "u"},
676 {WINED3D_SM4_OP_XOR, WINED3DSIH_XOR, "u", "uu"},
677 {WINED3D_SM4_OP_DCL_RESOURCE, WINED3DSIH_DCL, "R", "",
678 shader_sm4_read_dcl_resource},
679 {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER, WINED3DSIH_DCL_CONSTANT_BUFFER, "", "",
680 shader_sm4_read_dcl_constant_buffer},
681 {WINED3D_SM4_OP_DCL_SAMPLER, WINED3DSIH_DCL_SAMPLER, "", "",
682 shader_sm4_read_dcl_sampler},
683 {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY, WINED3DSIH_DCL_OUTPUT_TOPOLOGY, "", "",
684 shader_sm4_read_dcl_output_topology},
685 {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE, WINED3DSIH_DCL_INPUT_PRIMITIVE, "", "",
686 shader_sm4_read_dcl_input_primitive},
687 {WINED3D_SM4_OP_DCL_VERTICES_OUT, WINED3DSIH_DCL_VERTICES_OUT, "", "",
688 shader_sm4_read_declaration_count},
689 {WINED3D_SM4_OP_DCL_INPUT, WINED3DSIH_DCL_INPUT, "", "",
690 shader_sm4_read_declaration_dst},
691 {WINED3D_SM4_OP_DCL_INPUT_SGV, WINED3DSIH_DCL_INPUT_SGV, "", "",
692 shader_sm4_read_declaration_register_semantic},
693 {WINED3D_SM4_OP_DCL_INPUT_SIV, WINED3DSIH_DCL_INPUT_SIV, "", "",
694 shader_sm4_read_declaration_register_semantic},
695 {WINED3D_SM4_OP_DCL_INPUT_PS, WINED3DSIH_DCL_INPUT_PS, "", "",
696 shader_sm4_read_dcl_input_ps},
697 {WINED3D_SM4_OP_DCL_INPUT_PS_SGV, WINED3DSIH_DCL_INPUT_PS_SGV, "", "",
698 shader_sm4_read_declaration_register_semantic},
699 {WINED3D_SM4_OP_DCL_INPUT_PS_SIV, WINED3DSIH_DCL_INPUT_PS_SIV, "", "",
700 shader_sm4_read_dcl_input_ps_siv},
701 {WINED3D_SM4_OP_DCL_OUTPUT, WINED3DSIH_DCL_OUTPUT, "", "",
702 shader_sm4_read_declaration_dst},
703 {WINED3D_SM4_OP_DCL_OUTPUT_SIV, WINED3DSIH_DCL_OUTPUT_SIV, "", "",
704 shader_sm4_read_declaration_register_semantic},
705 {WINED3D_SM4_OP_DCL_TEMPS, WINED3DSIH_DCL_TEMPS, "", "",
706 shader_sm4_read_declaration_count},
707 {WINED3D_SM4_OP_DCL_GLOBAL_FLAGS, WINED3DSIH_DCL_GLOBAL_FLAGS, "", "",
708 shader_sm4_read_dcl_global_flags},
709 {WINED3D_SM5_OP_HS_DECLS, WINED3DSIH_HS_DECLS, "", ""},
710 {WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE, WINED3DSIH_HS_CONTROL_POINT_PHASE, "", ""},
711 {WINED3D_SM5_OP_HS_FORK_PHASE, WINED3DSIH_HS_FORK_PHASE, "", ""},
712 {WINED3D_SM5_OP_HS_JOIN_PHASE, WINED3DSIH_HS_JOIN_PHASE, "", ""},
713 {WINED3D_SM5_OP_DERIV_RTX_COARSE, WINED3DSIH_DSX_COARSE, "f", "f"},
714 {WINED3D_SM5_OP_DERIV_RTX_FINE, WINED3DSIH_DSX_FINE, "f", "f"},
715 {WINED3D_SM5_OP_DERIV_RTY_COARSE, WINED3DSIH_DSY_COARSE, "f", "f"},
716 {WINED3D_SM5_OP_DERIV_RTY_FINE, WINED3DSIH_DSY_FINE, "f", "f"},
717 {WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT, WINED3DSIH_DCL_INPUT_CONTROL_POINT_COUNT, "", "",
718 shader_sm5_read_control_point_count},
719 {WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT, WINED3DSIH_DCL_OUTPUT_CONTROL_POINT_COUNT, "", "",
720 shader_sm5_read_control_point_count},
721 {WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN, WINED3DSIH_DCL_TESSELLATOR_DOMAIN, "", "",
722 shader_sm5_read_dcl_tessellator_domain},
723 {WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING, WINED3DSIH_DCL_TESSELLATOR_PARTITIONING, "", "",
724 shader_sm5_read_dcl_tessellator_partitioning},
725 {WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, WINED3DSIH_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, "", "",
726 shader_sm5_read_dcl_tessellator_output_primitive},
727 {WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR, WINED3DSIH_DCL_HS_MAX_TESSFACTOR, "", "",
728 shader_sm5_read_dcl_hs_max_tessfactor},
729 {WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT, WINED3DSIH_DCL_HS_FORK_PHASE_INSTANCE_COUNT, "", "",
730 shader_sm4_read_declaration_count},
731 {WINED3D_SM5_OP_DCL_UAV_TYPED, WINED3DSIH_DCL_UAV_TYPED, "", "",
732 shader_sm4_read_dcl_resource},
733 {WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED, WINED3DSIH_DCL_RESOURCE_STRUCTURED, "", "",
734 shader_sm5_read_dcl_resource_structured},
735 {WINED3D_SM5_OP_STORE_UAV_TYPED, WINED3DSIH_STORE_UAV_TYPED, "", "Uif"},
736 {WINED3D_SM5_OP_LD_STRUCTURED, WINED3DSIH_LD_STRUCTURED, "u", "uuR"},
739 static const enum wined3d_shader_register_type register_type_table[] =
741 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP,
742 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT,
743 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT,
744 /* UNKNOWN */ ~0u,
745 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST,
746 /* UNKNOWN */ ~0u,
747 /* WINED3D_SM4_RT_SAMPLER */ WINED3DSPR_SAMPLER,
748 /* WINED3D_SM4_RT_RESOURCE */ WINED3DSPR_RESOURCE,
749 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER,
750 /* WINED3D_SM4_RT_IMMCONSTBUFFER */ WINED3DSPR_IMMCONSTBUFFER,
751 /* UNKNOWN */ ~0u,
752 /* WINED3D_SM4_RT_PRIMID */ WINED3DSPR_PRIMID,
753 /* WINED3D_SM4_RT_DEPTHOUT */ WINED3DSPR_DEPTHOUT,
754 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL,
755 /* UNKNOWN */ ~0u,
756 /* UNKNOWN */ ~0u,
757 /* UNKNOWN */ ~0u,
758 /* UNKNOWN */ ~0u,
759 /* UNKNOWN */ ~0u,
760 /* UNKNOWN */ ~0u,
761 /* UNKNOWN */ ~0u,
762 /* UNKNOWN */ ~0u,
763 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID */ WINED3DSPR_OUTPOINTID,
764 /* WINED3D_SM5_RT_FORK_INSTANCE_ID */ WINED3DSPR_FORKINSTID,
765 /* UNKNOWN */ ~0u,
766 /* WINED3D_SM5_RT_INPUT_CONTROL_POINT */ WINED3DSPR_INCONTROLPOINT,
767 /* UNKNOWN */ ~0u,
768 /* WINED3D_SM5_RT_PATCH_CONSTANT_DATA */ WINED3DSPR_PATCHCONST,
769 /* WINED3D_SM5_RT_DOMAIN_LOCATION */ WINED3DSPR_TESSCOORD,
770 /* UNKNOWN */ ~0u,
771 /* WINED3D_SM5_RT_UAV */ WINED3DSPR_UAV,
774 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
776 unsigned int i;
778 for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
780 if (opcode == opcode_table[i].opcode) return &opcode_table[i];
783 return NULL;
786 static void map_register(const struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
788 switch (priv->shader_version.type)
790 case WINED3D_SHADER_TYPE_PIXEL:
791 if (reg->type == WINED3DSPR_OUTPUT)
793 unsigned int reg_idx = reg->idx[0].offset;
795 if (reg_idx >= ARRAY_SIZE(priv->output_map))
797 ERR("Invalid output index %u.\n", reg_idx);
798 break;
801 reg->type = WINED3DSPR_COLOROUT;
802 reg->idx[0].offset = priv->output_map[reg_idx];
804 break;
806 default:
807 break;
811 static enum wined3d_data_type map_data_type(char t)
813 switch (t)
815 case 'f':
816 return WINED3D_DATA_FLOAT;
817 case 'i':
818 return WINED3D_DATA_INT;
819 case 'u':
820 return WINED3D_DATA_UINT;
821 case 'R':
822 return WINED3D_DATA_RESOURCE;
823 case 'S':
824 return WINED3D_DATA_SAMPLER;
825 case 'U':
826 return WINED3D_DATA_UAV;
827 default:
828 ERR("Invalid data type '%c'.\n", t);
829 return WINED3D_DATA_FLOAT;
833 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
835 struct wined3d_sm4_data *priv;
836 unsigned int i;
838 if (!(priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv))))
840 ERR("Failed to allocate private data\n");
841 return NULL;
844 memset(priv->output_map, 0xff, sizeof(priv->output_map));
845 for (i = 0; i < output_signature->element_count; ++i)
847 struct wined3d_shader_signature_element *e = &output_signature->elements[i];
849 if (e->register_idx >= ARRAY_SIZE(priv->output_map))
851 WARN("Invalid output index %u.\n", e->register_idx);
852 continue;
855 priv->output_map[e->register_idx] = e->semantic_idx;
858 list_init(&priv->src_free);
859 list_init(&priv->src);
861 return priv;
864 static void shader_sm4_free(void *data)
866 struct wined3d_shader_src_param_entry *e1, *e2;
867 struct wined3d_sm4_data *priv = data;
869 list_move_head(&priv->src_free, &priv->src);
870 LIST_FOR_EACH_ENTRY_SAFE(e1, e2, &priv->src_free, struct wined3d_shader_src_param_entry, entry)
872 HeapFree(GetProcessHeap(), 0, e1);
874 HeapFree(GetProcessHeap(), 0, priv);
877 static struct wined3d_shader_src_param *get_src_param(struct wined3d_sm4_data *priv)
879 struct wined3d_shader_src_param_entry *e;
880 struct list *elem;
882 if (!list_empty(&priv->src_free))
884 elem = list_head(&priv->src_free);
885 list_remove(elem);
887 else
889 if (!(e = HeapAlloc(GetProcessHeap(), 0, sizeof(*e))))
890 return NULL;
891 elem = &e->entry;
894 list_add_tail(&priv->src, elem);
895 e = LIST_ENTRY(elem, struct wined3d_shader_src_param_entry, entry);
896 return &e->param;
899 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
901 struct wined3d_sm4_data *priv = data;
902 DWORD version_token;
904 priv->end = *ptr;
906 version_token = *(*ptr)++;
907 TRACE("Version: 0x%08x.\n", version_token);
909 TRACE("Token count: %u.\n", **ptr);
910 priv->end += *(*ptr)++;
912 switch (version_token >> 16)
914 case WINED3D_SM4_PS:
915 priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
916 break;
918 case WINED3D_SM4_VS:
919 priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
920 break;
922 case WINED3D_SM4_GS:
923 priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
924 break;
926 case WINED3D_SM5_HS:
927 priv->shader_version.type = WINED3D_SHADER_TYPE_HULL;
928 break;
930 case WINED3D_SM5_DS:
931 priv->shader_version.type = WINED3D_SHADER_TYPE_DOMAIN;
932 break;
934 default:
935 FIXME("Unrecognized shader type %#x.\n", version_token >> 16);
937 priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
938 priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
940 *shader_version = priv->shader_version;
943 static BOOL shader_sm4_read_reg_idx(struct wined3d_sm4_data *priv, const DWORD **ptr,
944 DWORD addressing, struct wined3d_shader_register_index *reg_idx)
946 if (addressing & WINED3D_SM4_ADDRESSING_RELATIVE)
948 struct wined3d_shader_src_param *rel_addr = get_src_param(priv);
950 if (!(reg_idx->rel_addr = rel_addr))
952 ERR("Failed to get src param for relative addressing.\n");
953 return FALSE;
956 if (addressing & WINED3D_SM4_ADDRESSING_OFFSET)
957 reg_idx->offset = *(*ptr)++;
958 else
959 reg_idx->offset = 0;
960 shader_sm4_read_src_param(priv, ptr, WINED3D_DATA_INT, rel_addr);
962 else
964 reg_idx->rel_addr = NULL;
965 reg_idx->offset = *(*ptr)++;
968 return TRUE;
971 static BOOL shader_sm4_read_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
972 enum wined3d_data_type data_type, struct wined3d_shader_register *param,
973 enum wined3d_shader_src_modifier *modifier)
975 enum wined3d_sm4_register_type register_type;
976 DWORD token = *(*ptr)++;
977 DWORD order;
979 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
980 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table)
981 || register_type_table[register_type] == ~0u)
983 FIXME("Unhandled register type %#x.\n", register_type);
984 param->type = WINED3DSPR_TEMP;
986 else
988 param->type = register_type_table[register_type];
990 param->data_type = data_type;
992 if (token & WINED3D_SM4_REGISTER_MODIFIER)
994 DWORD m = *(*ptr)++;
996 switch (m)
998 case 0x41:
999 *modifier = WINED3DSPSM_NEG;
1000 break;
1002 case 0x81:
1003 *modifier = WINED3DSPSM_ABS;
1004 break;
1006 case 0xc1:
1007 *modifier = WINED3DSPSM_ABSNEG;
1008 break;
1010 default:
1011 FIXME("Skipping modifier 0x%08x.\n", m);
1012 *modifier = WINED3DSPSM_NONE;
1013 break;
1016 else
1018 *modifier = WINED3DSPSM_NONE;
1021 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
1023 if (order < 1)
1024 param->idx[0].offset = ~0U;
1025 else
1027 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK0) >> WINED3D_SM4_ADDRESSING_SHIFT0;
1028 if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[0])))
1030 ERR("Failed to read register index.\n");
1031 return FALSE;
1035 if (order < 2)
1036 param->idx[1].offset = ~0U;
1037 else
1039 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK1) >> WINED3D_SM4_ADDRESSING_SHIFT1;
1040 if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[1])))
1042 ERR("Failed to read register index.\n");
1043 return FALSE;
1047 if (order > 2)
1048 FIXME("Unhandled order %u.\n", order);
1050 if (register_type == WINED3D_SM4_RT_IMMCONST)
1052 enum wined3d_sm4_immconst_type immconst_type =
1053 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
1055 switch (immconst_type)
1057 case WINED3D_SM4_IMMCONST_SCALAR:
1058 param->immconst_type = WINED3D_IMMCONST_SCALAR;
1059 memcpy(param->immconst_data, *ptr, 1 * sizeof(DWORD));
1060 *ptr += 1;
1061 break;
1063 case WINED3D_SM4_IMMCONST_VEC4:
1064 param->immconst_type = WINED3D_IMMCONST_VEC4;
1065 memcpy(param->immconst_data, *ptr, 4 * sizeof(DWORD));
1066 *ptr += 4;
1067 break;
1069 default:
1070 FIXME("Unhandled immediate constant type %#x.\n", immconst_type);
1071 break;
1075 map_register(priv, param);
1077 return TRUE;
1080 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
1081 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param)
1083 DWORD token = **ptr;
1085 if (!shader_sm4_read_param(priv, ptr, data_type, &src_param->reg, &src_param->modifiers))
1087 ERR("Failed to read parameter.\n");
1088 return FALSE;
1091 if (src_param->reg.type == WINED3DSPR_IMMCONST)
1093 src_param->swizzle = WINED3DSP_NOSWIZZLE;
1095 else
1097 enum wined3d_sm4_swizzle_type swizzle_type =
1098 (token & WINED3D_SM4_SWIZZLE_TYPE_MASK) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT;
1100 switch (swizzle_type)
1102 case WINED3D_SM4_SWIZZLE_NONE:
1103 src_param->swizzle = WINED3DSP_NOSWIZZLE;
1104 break;
1106 case WINED3D_SM4_SWIZZLE_SCALAR:
1107 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
1108 src_param->swizzle = (src_param->swizzle & 0x3) * 0x55;
1109 break;
1111 case WINED3D_SM4_SWIZZLE_VEC4:
1112 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
1113 break;
1115 default:
1116 FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
1117 break;
1121 return TRUE;
1124 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
1125 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param)
1127 enum wined3d_shader_src_modifier modifier;
1128 DWORD token = **ptr;
1130 if (!shader_sm4_read_param(priv, ptr, data_type, &dst_param->reg, &modifier))
1132 ERR("Failed to read parameter.\n");
1133 return FALSE;
1136 if (modifier != WINED3DSPSM_NONE)
1138 ERR("Invalid source modifier %#x on destination register.\n", modifier);
1139 return FALSE;
1142 dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
1143 dst_param->modifiers = 0;
1144 dst_param->shift = 0;
1146 return TRUE;
1149 static void shader_sm4_read_instruction(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins)
1151 const struct wined3d_sm4_opcode_info *opcode_info;
1152 struct wined3d_sm4_data *priv = data;
1153 DWORD opcode_token, opcode;
1154 unsigned int i, len;
1155 const DWORD *p;
1157 list_move_head(&priv->src_free, &priv->src);
1159 opcode_token = *(*ptr)++;
1160 opcode = opcode_token & WINED3D_SM4_OPCODE_MASK;
1162 len = ((opcode_token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT);
1163 if (!len)
1164 len = **ptr;
1165 --len;
1167 if (TRACE_ON(d3d_bytecode))
1169 TRACE_(d3d_bytecode)("[ %08x ", opcode_token);
1170 for (i = 0; i < len; ++i)
1172 TRACE_(d3d_bytecode)("%08x ", (*ptr)[i]);
1174 TRACE_(d3d_bytecode)("]\n");
1177 if (!(opcode_info = get_opcode_info(opcode)))
1179 FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode, opcode_token);
1180 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1181 *ptr += len;
1182 return;
1185 ins->handler_idx = opcode_info->handler_idx;
1186 ins->flags = 0;
1187 ins->coissue = 0;
1188 ins->predicate = NULL;
1189 ins->dst_count = strlen(opcode_info->dst_info);
1190 ins->dst = priv->dst_param;
1191 ins->src_count = strlen(opcode_info->src_info);
1192 ins->src = priv->src_param;
1193 memset(&ins->texel_offset, 0, sizeof(ins->texel_offset));
1195 p = *ptr;
1196 *ptr += len;
1198 if (opcode_token & WINED3D_SM4_INSTRUCTION_MODIFIER)
1200 static const DWORD recognized_bits = WINED3D_SM4_MODIFIER_AOFFIMMI
1201 | WINED3D_SM4_AOFFIMMI_U_MASK
1202 | WINED3D_SM4_AOFFIMMI_V_MASK
1203 | WINED3D_SM4_AOFFIMMI_W_MASK;
1204 DWORD modifier = *p++;
1205 /* Bit fields are used for sign extension */
1206 struct
1208 int u : 4;
1209 int v : 4;
1210 int w : 4;
1212 aoffimmi;
1214 if (modifier & ~recognized_bits)
1216 FIXME("Skipping modifier 0x%08x.\n", modifier);
1218 else
1220 aoffimmi.u = (modifier & WINED3D_SM4_AOFFIMMI_U_MASK) >> WINED3D_SM4_AOFFIMMI_U_SHIFT;
1221 aoffimmi.v = (modifier & WINED3D_SM4_AOFFIMMI_V_MASK) >> WINED3D_SM4_AOFFIMMI_V_SHIFT;
1222 aoffimmi.w = (modifier & WINED3D_SM4_AOFFIMMI_W_MASK) >> WINED3D_SM4_AOFFIMMI_W_SHIFT;
1223 ins->texel_offset.u = aoffimmi.u;
1224 ins->texel_offset.v = aoffimmi.v;
1225 ins->texel_offset.w = aoffimmi.w;
1229 if (opcode_info->read_opcode_func)
1231 opcode_info->read_opcode_func(ins, opcode, opcode_token, p, len, priv);
1233 else
1235 enum wined3d_shader_dst_modifier instruction_dst_modifier = WINED3DSPDM_NONE;
1237 ins->flags = (opcode_token & WINED3D_SM4_INSTRUCTION_FLAGS_MASK) >> WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT;
1239 if (ins->flags & WINED3D_SM4_INSTRUCTION_FLAG_SATURATE)
1241 ins->flags &= ~WINED3D_SM4_INSTRUCTION_FLAG_SATURATE;
1242 instruction_dst_modifier = WINED3DSPDM_SATURATE;
1245 for (i = 0; i < ins->dst_count; ++i)
1247 if (!(shader_sm4_read_dst_param(priv, &p, map_data_type(opcode_info->dst_info[i]), &priv->dst_param[i])))
1249 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1250 return;
1252 priv->dst_param[i].modifiers |= instruction_dst_modifier;
1255 for (i = 0; i < ins->src_count; ++i)
1257 if (!(shader_sm4_read_src_param(priv, &p, map_data_type(opcode_info->src_info[i]), &priv->src_param[i])))
1259 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1260 return;
1266 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
1268 struct wined3d_sm4_data *priv = data;
1269 return *ptr == priv->end;
1272 const struct wined3d_shader_frontend sm4_shader_frontend =
1274 shader_sm4_init,
1275 shader_sm4_free,
1276 shader_sm4_read_header,
1277 shader_sm4_read_instruction,
1278 shader_sm4_is_end,