wined3d: Recognize SM5 imm_atomic_imax opcode.
[wine.git] / dlls / wined3d / shader_sm4.c
blob44a9da98f527bad48dd2bcaba8998c56ba52f46a
1 /*
2 * Copyright 2009 Henri Verbeet for CodeWeavers
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
9 * This library is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
19 #include "config.h"
20 #include "wine/port.h"
22 #include "wined3d_private.h"
24 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
25 WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode);
27 #define WINED3D_SM4_INSTRUCTION_MODIFIER (0x1u << 31)
29 #define WINED3D_SM4_MODIFIER_AOFFIMMI 0x1
30 #define WINED3D_SM4_AOFFIMMI_U_SHIFT 9
31 #define WINED3D_SM4_AOFFIMMI_U_MASK (0xfu << WINED3D_SM4_AOFFIMMI_U_SHIFT)
32 #define WINED3D_SM4_AOFFIMMI_V_SHIFT 13
33 #define WINED3D_SM4_AOFFIMMI_V_MASK (0xfu << WINED3D_SM4_AOFFIMMI_V_SHIFT)
34 #define WINED3D_SM4_AOFFIMMI_W_SHIFT 17
35 #define WINED3D_SM4_AOFFIMMI_W_MASK (0xfu << WINED3D_SM4_AOFFIMMI_W_SHIFT)
37 #define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT 24
38 #define WINED3D_SM4_INSTRUCTION_LENGTH_MASK (0x1fu << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)
40 #define WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT 11
41 #define WINED3D_SM4_INSTRUCTION_FLAGS_MASK (0x7u << WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT)
43 #define WINED3D_SM4_RESOURCE_TYPE_SHIFT 11
44 #define WINED3D_SM4_RESOURCE_TYPE_MASK (0xfu << WINED3D_SM4_RESOURCE_TYPE_SHIFT)
46 #define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT 11
47 #define WINED3D_SM4_PRIMITIVE_TYPE_MASK (0x7u << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)
49 #define WINED3D_SM4_INDEX_TYPE_SHIFT 11
50 #define WINED3D_SM4_INDEX_TYPE_MASK (0x1u << WINED3D_SM4_INDEX_TYPE_SHIFT)
52 #define WINED3D_SM4_SAMPLER_MODE_SHIFT 11
53 #define WINED3D_SM4_SAMPLER_MODE_MASK (0xfu << WINED3D_SM4_SAMPLER_MODE_SHIFT)
55 #define WINED3D_SM4_SHADER_DATA_TYPE_SHIFT 11
56 #define WINED3D_SM4_SHADER_DATA_TYPE_MASK (0xfu << WINED3D_SM4_SHADER_DATA_TYPE_SHIFT)
58 #define WINED3D_SM4_INTERPOLATION_MODE_SHIFT 11
59 #define WINED3D_SM4_INTERPOLATION_MODE_MASK (0xfu << WINED3D_SM4_INTERPOLATION_MODE_SHIFT)
61 #define WINED3D_SM4_GLOBAL_FLAGS_SHIFT 11
62 #define WINED3D_SM4_GLOBAL_FLAGS_MASK (0xffu << WINED3D_SM4_GLOBAL_FLAGS_SHIFT)
64 #define WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT 11
65 #define WINED3D_SM5_CONTROL_POINT_COUNT_MASK (0xffu << WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT)
67 #define WINED3D_SM5_FP_ARRAY_SIZE_SHIFT 16
68 #define WINED3D_SM5_FP_TABLE_COUNT_MASK 0xffffu
70 #define WINED3D_SM5_UAV_FLAGS_SHIFT 11
71 #define WINED3D_SM5_UAV_FLAGS_MASK (0x8fffu << WINED3D_SM5_UAV_FLAGS_SHIFT)
73 #define WINED3D_SM5_SYNC_FLAGS_SHIFT 11
74 #define WINED3D_SM5_SYNC_FLAGS_MASK (0xffu << WINED3D_SM5_SYNC_FLAGS_SHIFT)
76 #define WINED3D_SM5_TESSELLATOR_SHIFT 11
77 #define WINED3D_SM5_TESSELLATOR_MASK (0xfu << WINED3D_SM5_TESSELLATOR_SHIFT)
79 #define WINED3D_SM4_OPCODE_MASK 0xff
81 #define WINED3D_SM4_REGISTER_MODIFIER (0x1u << 31)
83 #define WINED3D_SM4_ADDRESSING_SHIFT1 25
84 #define WINED3D_SM4_ADDRESSING_MASK1 (0x3u << WINED3D_SM4_ADDRESSING_SHIFT1)
86 #define WINED3D_SM4_ADDRESSING_SHIFT0 22
87 #define WINED3D_SM4_ADDRESSING_MASK0 (0x3u << WINED3D_SM4_ADDRESSING_SHIFT0)
89 #define WINED3D_SM4_REGISTER_ORDER_SHIFT 20
90 #define WINED3D_SM4_REGISTER_ORDER_MASK (0x3u << WINED3D_SM4_REGISTER_ORDER_SHIFT)
92 #define WINED3D_SM4_REGISTER_TYPE_SHIFT 12
93 #define WINED3D_SM4_REGISTER_TYPE_MASK (0xffu << WINED3D_SM4_REGISTER_TYPE_SHIFT)
95 #define WINED3D_SM4_SWIZZLE_TYPE_SHIFT 2
96 #define WINED3D_SM4_SWIZZLE_TYPE_MASK (0x3u << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)
98 #define WINED3D_SM4_IMMCONST_TYPE_SHIFT 0
99 #define WINED3D_SM4_IMMCONST_TYPE_MASK (0x3u << WINED3D_SM4_IMMCONST_TYPE_SHIFT)
101 #define WINED3D_SM4_WRITEMASK_SHIFT 4
102 #define WINED3D_SM4_WRITEMASK_MASK (0xfu << WINED3D_SM4_WRITEMASK_SHIFT)
104 #define WINED3D_SM4_SWIZZLE_SHIFT 4
105 #define WINED3D_SM4_SWIZZLE_MASK (0xffu << WINED3D_SM4_SWIZZLE_SHIFT)
107 #define WINED3D_SM4_VERSION_MAJOR(version) (((version) >> 4) & 0xf)
108 #define WINED3D_SM4_VERSION_MINOR(version) (((version) >> 0) & 0xf)
110 #define WINED3D_SM4_ADDRESSING_RELATIVE 0x2
111 #define WINED3D_SM4_ADDRESSING_OFFSET 0x1
113 #define WINED3D_SM4_INSTRUCTION_FLAG_SATURATE 0x4
115 #define WINED3D_SM4_CONDITIONAL_NZ (0x1u << 18)
117 enum wined3d_sm4_opcode
119 WINED3D_SM4_OP_ADD = 0x00,
120 WINED3D_SM4_OP_AND = 0x01,
121 WINED3D_SM4_OP_BREAK = 0x02,
122 WINED3D_SM4_OP_BREAKC = 0x03,
123 WINED3D_SM4_OP_CASE = 0x06,
124 WINED3D_SM4_OP_CONTINUE = 0x07,
125 WINED3D_SM4_OP_CUT = 0x09,
126 WINED3D_SM4_OP_DEFAULT = 0x0a,
127 WINED3D_SM4_OP_DERIV_RTX = 0x0b,
128 WINED3D_SM4_OP_DERIV_RTY = 0x0c,
129 WINED3D_SM4_OP_DISCARD = 0x0d,
130 WINED3D_SM4_OP_DIV = 0x0e,
131 WINED3D_SM4_OP_DP2 = 0x0f,
132 WINED3D_SM4_OP_DP3 = 0x10,
133 WINED3D_SM4_OP_DP4 = 0x11,
134 WINED3D_SM4_OP_ELSE = 0x12,
135 WINED3D_SM4_OP_EMIT = 0x13,
136 WINED3D_SM4_OP_ENDIF = 0x15,
137 WINED3D_SM4_OP_ENDLOOP = 0x16,
138 WINED3D_SM4_OP_ENDSWITCH = 0x17,
139 WINED3D_SM4_OP_EQ = 0x18,
140 WINED3D_SM4_OP_EXP = 0x19,
141 WINED3D_SM4_OP_FRC = 0x1a,
142 WINED3D_SM4_OP_FTOI = 0x1b,
143 WINED3D_SM4_OP_FTOU = 0x1c,
144 WINED3D_SM4_OP_GE = 0x1d,
145 WINED3D_SM4_OP_IADD = 0x1e,
146 WINED3D_SM4_OP_IF = 0x1f,
147 WINED3D_SM4_OP_IEQ = 0x20,
148 WINED3D_SM4_OP_IGE = 0x21,
149 WINED3D_SM4_OP_ILT = 0x22,
150 WINED3D_SM4_OP_IMAD = 0x23,
151 WINED3D_SM4_OP_IMAX = 0x24,
152 WINED3D_SM4_OP_IMIN = 0x25,
153 WINED3D_SM4_OP_IMUL = 0x26,
154 WINED3D_SM4_OP_INE = 0x27,
155 WINED3D_SM4_OP_INEG = 0x28,
156 WINED3D_SM4_OP_ISHL = 0x29,
157 WINED3D_SM4_OP_ISHR = 0x2a,
158 WINED3D_SM4_OP_ITOF = 0x2b,
159 WINED3D_SM4_OP_LABEL = 0x2c,
160 WINED3D_SM4_OP_LD = 0x2d,
161 WINED3D_SM4_OP_LD2DMS = 0x2e,
162 WINED3D_SM4_OP_LOG = 0x2f,
163 WINED3D_SM4_OP_LOOP = 0x30,
164 WINED3D_SM4_OP_LT = 0x31,
165 WINED3D_SM4_OP_MAD = 0x32,
166 WINED3D_SM4_OP_MIN = 0x33,
167 WINED3D_SM4_OP_MAX = 0x34,
168 WINED3D_SM4_OP_SHADER_DATA = 0x35,
169 WINED3D_SM4_OP_MOV = 0x36,
170 WINED3D_SM4_OP_MOVC = 0x37,
171 WINED3D_SM4_OP_MUL = 0x38,
172 WINED3D_SM4_OP_NE = 0x39,
173 WINED3D_SM4_OP_NOT = 0x3b,
174 WINED3D_SM4_OP_OR = 0x3c,
175 WINED3D_SM4_OP_RESINFO = 0x3d,
176 WINED3D_SM4_OP_RET = 0x3e,
177 WINED3D_SM4_OP_ROUND_NE = 0x40,
178 WINED3D_SM4_OP_ROUND_NI = 0x41,
179 WINED3D_SM4_OP_ROUND_PI = 0x42,
180 WINED3D_SM4_OP_ROUND_Z = 0x43,
181 WINED3D_SM4_OP_RSQ = 0x44,
182 WINED3D_SM4_OP_SAMPLE = 0x45,
183 WINED3D_SM4_OP_SAMPLE_C = 0x46,
184 WINED3D_SM4_OP_SAMPLE_C_LZ = 0x47,
185 WINED3D_SM4_OP_SAMPLE_LOD = 0x48,
186 WINED3D_SM4_OP_SAMPLE_GRAD = 0x49,
187 WINED3D_SM4_OP_SAMPLE_B = 0x4a,
188 WINED3D_SM4_OP_SQRT = 0x4b,
189 WINED3D_SM4_OP_SWITCH = 0x4c,
190 WINED3D_SM4_OP_SINCOS = 0x4d,
191 WINED3D_SM4_OP_UDIV = 0x4e,
192 WINED3D_SM4_OP_ULT = 0x4f,
193 WINED3D_SM4_OP_UGE = 0x50,
194 WINED3D_SM4_OP_UMAX = 0x53,
195 WINED3D_SM4_OP_UMIN = 0x54,
196 WINED3D_SM4_OP_USHR = 0x55,
197 WINED3D_SM4_OP_UTOF = 0x56,
198 WINED3D_SM4_OP_XOR = 0x57,
199 WINED3D_SM4_OP_DCL_RESOURCE = 0x58,
200 WINED3D_SM4_OP_DCL_CONSTANT_BUFFER = 0x59,
201 WINED3D_SM4_OP_DCL_SAMPLER = 0x5a,
202 WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY = 0x5c,
203 WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE = 0x5d,
204 WINED3D_SM4_OP_DCL_VERTICES_OUT = 0x5e,
205 WINED3D_SM4_OP_DCL_INPUT = 0x5f,
206 WINED3D_SM4_OP_DCL_INPUT_SGV = 0x60,
207 WINED3D_SM4_OP_DCL_INPUT_SIV = 0x61,
208 WINED3D_SM4_OP_DCL_INPUT_PS = 0x62,
209 WINED3D_SM4_OP_DCL_INPUT_PS_SGV = 0x63,
210 WINED3D_SM4_OP_DCL_INPUT_PS_SIV = 0x64,
211 WINED3D_SM4_OP_DCL_OUTPUT = 0x65,
212 WINED3D_SM4_OP_DCL_OUTPUT_SIV = 0x67,
213 WINED3D_SM4_OP_DCL_TEMPS = 0x68,
214 WINED3D_SM4_OP_DCL_INDEXABLE_TEMP = 0x69,
215 WINED3D_SM4_OP_DCL_GLOBAL_FLAGS = 0x6a,
216 WINED3D_SM4_OP_LOD = 0x6c,
217 WINED3D_SM4_OP_GATHER4 = 0x6d,
218 WINED3D_SM4_OP_SAMPLE_POS = 0x6e,
219 WINED3D_SM4_OP_SAMPLE_INFO = 0x6f,
220 WINED3D_SM5_OP_HS_DECLS = 0x71,
221 WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE = 0x72,
222 WINED3D_SM5_OP_HS_FORK_PHASE = 0x73,
223 WINED3D_SM5_OP_HS_JOIN_PHASE = 0x74,
224 WINED3D_SM5_OP_EMIT_STREAM = 0x75,
225 WINED3D_SM5_OP_CUT_STREAM = 0x76,
226 WINED3D_SM5_OP_FCALL = 0x78,
227 WINED3D_SM5_OP_BUFINFO = 0x79,
228 WINED3D_SM5_OP_DERIV_RTX_COARSE = 0x7a,
229 WINED3D_SM5_OP_DERIV_RTX_FINE = 0x7b,
230 WINED3D_SM5_OP_DERIV_RTY_COARSE = 0x7c,
231 WINED3D_SM5_OP_DERIV_RTY_FINE = 0x7d,
232 WINED3D_SM5_OP_GATHER4_C = 0x7e,
233 WINED3D_SM5_OP_RCP = 0x81,
234 WINED3D_SM5_OP_F32TOF16 = 0x82,
235 WINED3D_SM5_OP_F16TOF32 = 0x83,
236 WINED3D_SM5_OP_COUNTBITS = 0x86,
237 WINED3D_SM5_OP_FIRSTBIT_HI = 0x87,
238 WINED3D_SM5_OP_FIRSTBIT_LO = 0x88,
239 WINED3D_SM5_OP_FIRSTBIT_SHI = 0x89,
240 WINED3D_SM5_OP_UBFE = 0x8a,
241 WINED3D_SM5_OP_BFI = 0x8c,
242 WINED3D_SM5_OP_BFREV = 0x8d,
243 WINED3D_SM5_OP_SWAPC = 0x8e,
244 WINED3D_SM5_OP_DCL_STREAM = 0x8f,
245 WINED3D_SM5_OP_DCL_FUNCTION_BODY = 0x90,
246 WINED3D_SM5_OP_DCL_FUNCTION_TABLE = 0x91,
247 WINED3D_SM5_OP_DCL_INTERFACE = 0x92,
248 WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT = 0x93,
249 WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT = 0x94,
250 WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN = 0x95,
251 WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING = 0x96,
252 WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE = 0x97,
253 WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR = 0x98,
254 WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT = 0x99,
255 WINED3D_SM5_OP_DCL_THREAD_GROUP = 0x9b,
256 WINED3D_SM5_OP_DCL_UAV_TYPED = 0x9c,
257 WINED3D_SM5_OP_DCL_UAV_RAW = 0x9d,
258 WINED3D_SM5_OP_DCL_UAV_STRUCTURED = 0x9e,
259 WINED3D_SM5_OP_DCL_TGSM_RAW = 0x9f,
260 WINED3D_SM5_OP_DCL_TGSM_STRUCTURED = 0xa0,
261 WINED3D_SM5_OP_DCL_RESOURCE_RAW = 0xa1,
262 WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED = 0xa2,
263 WINED3D_SM5_OP_LD_UAV_TYPED = 0xa3,
264 WINED3D_SM5_OP_STORE_UAV_TYPED = 0xa4,
265 WINED3D_SM5_OP_LD_RAW = 0xa5,
266 WINED3D_SM5_OP_STORE_RAW = 0xa6,
267 WINED3D_SM5_OP_LD_STRUCTURED = 0xa7,
268 WINED3D_SM5_OP_STORE_STRUCTURED = 0xa8,
269 WINED3D_SM5_OP_ATOMIC_AND = 0xa9,
270 WINED3D_SM5_OP_ATOMIC_OR = 0xaa,
271 WINED3D_SM5_OP_ATOMIC_XOR = 0xab,
272 WINED3D_SM5_OP_ATOMIC_CMP_STORE = 0xac,
273 WINED3D_SM5_OP_ATOMIC_IADD = 0xad,
274 WINED3D_SM5_OP_ATOMIC_IMAX = 0xae,
275 WINED3D_SM5_OP_ATOMIC_IMIN = 0xaf,
276 WINED3D_SM5_OP_ATOMIC_UMAX = 0xb0,
277 WINED3D_SM5_OP_ATOMIC_UMIN = 0xb1,
278 WINED3D_SM5_OP_IMM_ATOMIC_ALLOC = 0xb2,
279 WINED3D_SM5_OP_IMM_ATOMIC_CONSUME = 0xb3,
280 WINED3D_SM5_OP_IMM_ATOMIC_IADD = 0xb4,
281 WINED3D_SM5_OP_IMM_ATOMIC_AND = 0xb5,
282 WINED3D_SM5_OP_IMM_ATOMIC_OR = 0xb6,
283 WINED3D_SM5_OP_IMM_ATOMIC_XOR = 0xb7,
284 WINED3D_SM5_OP_IMM_ATOMIC_EXCH = 0xb8,
285 WINED3D_SM5_OP_IMM_ATOMIC_CMP_EXCH = 0xb9,
286 WINED3D_SM5_OP_IMM_ATOMIC_IMAX = 0xba,
287 WINED3D_SM5_OP_IMM_ATOMIC_UMAX = 0xbc,
288 WINED3D_SM5_OP_IMM_ATOMIC_UMIN = 0xbd,
289 WINED3D_SM5_OP_SYNC = 0xbe,
292 enum wined3d_sm4_register_type
294 WINED3D_SM4_RT_TEMP = 0x00,
295 WINED3D_SM4_RT_INPUT = 0x01,
296 WINED3D_SM4_RT_OUTPUT = 0x02,
297 WINED3D_SM4_RT_INDEXABLE_TEMP = 0x03,
298 WINED3D_SM4_RT_IMMCONST = 0x04,
299 WINED3D_SM4_RT_SAMPLER = 0x06,
300 WINED3D_SM4_RT_RESOURCE = 0x07,
301 WINED3D_SM4_RT_CONSTBUFFER = 0x08,
302 WINED3D_SM4_RT_IMMCONSTBUFFER = 0x09,
303 WINED3D_SM4_RT_PRIMID = 0x0b,
304 WINED3D_SM4_RT_DEPTHOUT = 0x0c,
305 WINED3D_SM4_RT_NULL = 0x0d,
306 WINED3D_SM4_RT_OMASK = 0x0f,
307 WINED3D_SM5_RT_STREAM = 0x10,
308 WINED3D_SM5_RT_FUNCTION_BODY = 0x11,
309 WINED3D_SM5_RT_FUNCTION_POINTER = 0x13,
310 WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID = 0x16,
311 WINED3D_SM5_RT_FORK_INSTANCE_ID = 0x17,
312 WINED3D_SM5_RT_INPUT_CONTROL_POINT = 0x19,
313 WINED3D_SM5_RT_OUTPUT_CONTROL_POINT = 0x1a,
314 WINED3D_SM5_RT_PATCH_CONSTANT_DATA = 0x1b,
315 WINED3D_SM5_RT_DOMAIN_LOCATION = 0x1c,
316 WINED3D_SM5_RT_UAV = 0x1e,
317 WINED3D_SM5_RT_SHARED_MEMORY = 0x1f,
318 WINED3D_SM5_RT_THREAD_ID = 0x20,
319 WINED3D_SM5_RT_THREAD_GROUP_ID = 0x21,
320 WINED3D_SM5_RT_LOCAL_THREAD_ID = 0x22,
321 WINED3D_SM5_RT_COVERAGE = 0x23,
322 WINED3D_SM5_RT_LOCAL_THREAD_INDEX = 0x24,
325 enum wined3d_sm4_output_primitive_type
327 WINED3D_SM4_OUTPUT_PT_POINTLIST = 0x1,
328 WINED3D_SM4_OUTPUT_PT_LINELIST = 0x3,
329 WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
332 enum wined3d_sm4_input_primitive_type
334 WINED3D_SM4_INPUT_PT_POINT = 0x1,
335 WINED3D_SM4_INPUT_PT_LINE = 0x2,
336 WINED3D_SM4_INPUT_PT_TRIANGLE = 0x3,
337 WINED3D_SM4_INPUT_PT_LINEADJ = 0x6,
338 WINED3D_SM4_INPUT_PT_TRIANGLEADJ = 0x7,
341 enum wined3d_sm4_swizzle_type
343 WINED3D_SM4_SWIZZLE_NONE = 0x0,
344 WINED3D_SM4_SWIZZLE_VEC4 = 0x1,
345 WINED3D_SM4_SWIZZLE_SCALAR = 0x2,
348 enum wined3d_sm4_immconst_type
350 WINED3D_SM4_IMMCONST_SCALAR = 0x1,
351 WINED3D_SM4_IMMCONST_VEC4 = 0x2,
354 enum wined3d_sm4_resource_type
356 WINED3D_SM4_RESOURCE_BUFFER = 0x1,
357 WINED3D_SM4_RESOURCE_TEXTURE_1D = 0x2,
358 WINED3D_SM4_RESOURCE_TEXTURE_2D = 0x3,
359 WINED3D_SM4_RESOURCE_TEXTURE_2DMS = 0x4,
360 WINED3D_SM4_RESOURCE_TEXTURE_3D = 0x5,
361 WINED3D_SM4_RESOURCE_TEXTURE_CUBE = 0x6,
362 WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY = 0x7,
363 WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY = 0x8,
364 WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY = 0x9,
365 WINED3D_SM4_RESOURCE_TEXTURE_CUBEARRAY = 0xa,
368 enum wined3d_sm4_data_type
370 WINED3D_SM4_DATA_UNORM = 0x1,
371 WINED3D_SM4_DATA_SNORM = 0x2,
372 WINED3D_SM4_DATA_INT = 0x3,
373 WINED3D_SM4_DATA_UINT = 0x4,
374 WINED3D_SM4_DATA_FLOAT = 0x5,
377 enum wined3d_sm4_sampler_mode
379 WINED3D_SM4_SAMPLER_DEFAULT = 0x0,
380 WINED3D_SM4_SAMPLER_COMPARISON = 0x1,
383 enum wined3d_sm4_shader_data_type
385 WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER = 0x3,
386 WINED3D_SM4_SHADER_DATA_MESSAGE = 0x4,
389 struct wined3d_shader_src_param_entry
391 struct list entry;
392 struct wined3d_shader_src_param param;
395 struct wined3d_sm4_data
397 struct wined3d_shader_version shader_version;
398 const DWORD *end;
400 unsigned int output_map[MAX_REG_OUTPUT];
402 struct wined3d_shader_src_param src_param[5];
403 struct wined3d_shader_dst_param dst_param[2];
404 struct list src_free;
405 struct list src;
406 struct wined3d_shader_immediate_constant_buffer icb;
409 struct wined3d_sm4_opcode_info
411 enum wined3d_sm4_opcode opcode;
412 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
413 const char *dst_info;
414 const char *src_info;
415 void (*read_opcode_func)(struct wined3d_shader_instruction *ins,
416 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
417 struct wined3d_sm4_data *priv);
420 static const enum wined3d_primitive_type output_primitive_type_table[] =
422 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
423 /* WINED3D_SM4_OUTPUT_PT_POINTLIST */ WINED3D_PT_POINTLIST,
424 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
425 /* WINED3D_SM4_OUTPUT_PT_LINELIST */ WINED3D_PT_LINELIST,
426 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
427 /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ WINED3D_PT_TRIANGLESTRIP,
430 static const enum wined3d_primitive_type input_primitive_type_table[] =
432 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
433 /* WINED3D_SM4_INPUT_PT_POINT */ WINED3D_PT_POINTLIST,
434 /* WINED3D_SM4_INPUT_PT_LINE */ WINED3D_PT_LINELIST,
435 /* WINED3D_SM4_INPUT_PT_TRIANGLE */ WINED3D_PT_TRIANGLELIST,
436 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
437 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
438 /* WINED3D_SM4_INPUT_PT_LINEADJ */ WINED3D_PT_LINELIST_ADJ,
439 /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */ WINED3D_PT_TRIANGLELIST_ADJ,
442 static const enum wined3d_shader_resource_type resource_type_table[] =
444 /* 0 */ WINED3D_SHADER_RESOURCE_NONE,
445 /* WINED3D_SM4_RESOURCE_BUFFER */ WINED3D_SHADER_RESOURCE_BUFFER,
446 /* WINED3D_SM4_RESOURCE_TEXTURE_1D */ WINED3D_SHADER_RESOURCE_TEXTURE_1D,
447 /* WINED3D_SM4_RESOURCE_TEXTURE_2D */ WINED3D_SHADER_RESOURCE_TEXTURE_2D,
448 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMS */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMS,
449 /* WINED3D_SM4_RESOURCE_TEXTURE_3D */ WINED3D_SHADER_RESOURCE_TEXTURE_3D,
450 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBE */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBE,
451 /* WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_1DARRAY,
452 /* WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DARRAY,
453 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY,
454 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBEARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBEARRAY,
457 static const enum wined3d_data_type data_type_table[] =
459 /* 0 */ WINED3D_DATA_FLOAT,
460 /* WINED3D_SM4_DATA_UNORM */ WINED3D_DATA_UNORM,
461 /* WINED3D_SM4_DATA_SNORM */ WINED3D_DATA_SNORM,
462 /* WINED3D_SM4_DATA_INT */ WINED3D_DATA_INT,
463 /* WINED3D_SM4_DATA_UINT */ WINED3D_DATA_UINT,
464 /* WINED3D_SM4_DATA_FLOAT */ WINED3D_DATA_FLOAT,
467 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
468 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param);
469 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
470 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param);
472 static void shader_sm4_read_conditional_op(struct wined3d_shader_instruction *ins,
473 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
474 struct wined3d_sm4_data *priv)
476 shader_sm4_read_src_param(priv, &tokens, WINED3D_DATA_UINT, &priv->src_param[0]);
477 ins->flags = (opcode_token & WINED3D_SM4_CONDITIONAL_NZ) ?
478 WINED3D_SHADER_CONDITIONAL_OP_NZ : WINED3D_SHADER_CONDITIONAL_OP_Z;
481 static void shader_sm4_read_shader_data(struct wined3d_shader_instruction *ins,
482 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
483 struct wined3d_sm4_data *priv)
485 enum wined3d_sm4_shader_data_type type;
486 unsigned int icb_size;
488 type = (opcode_token & WINED3D_SM4_SHADER_DATA_TYPE_MASK) >> WINED3D_SM4_SHADER_DATA_TYPE_SHIFT;
489 if (type != WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER)
491 FIXME("Unhandled shader data type %#x.\n", type);
492 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
493 return;
496 ++tokens;
497 icb_size = token_count - 1;
498 if (icb_size % 4 || icb_size > MAX_IMMEDIATE_CONSTANT_BUFFER_SIZE)
500 FIXME("Unexpected immediate constant buffer size %u.\n", icb_size);
501 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
502 return;
505 priv->icb.vec4_count = icb_size / 4;
506 memcpy(priv->icb.data, tokens, sizeof(*tokens) * icb_size);
507 ins->declaration.icb = &priv->icb;
510 static void shader_sm4_read_dcl_resource(struct wined3d_shader_instruction *ins,
511 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
512 struct wined3d_sm4_data *priv)
514 enum wined3d_sm4_resource_type resource_type;
515 enum wined3d_sm4_data_type data_type;
516 enum wined3d_data_type reg_data_type;
517 DWORD components;
519 resource_type = (opcode_token & WINED3D_SM4_RESOURCE_TYPE_MASK) >> WINED3D_SM4_RESOURCE_TYPE_SHIFT;
520 if (!resource_type || (resource_type >= ARRAY_SIZE(resource_type_table)))
522 FIXME("Unhandled resource type %#x.\n", resource_type);
523 ins->declaration.semantic.resource_type = WINED3D_SHADER_RESOURCE_NONE;
525 else
527 ins->declaration.semantic.resource_type = resource_type_table[resource_type];
529 reg_data_type = opcode == WINED3D_SM4_OP_DCL_RESOURCE ? WINED3D_DATA_RESOURCE : WINED3D_DATA_UAV;
530 shader_sm4_read_dst_param(priv, &tokens, reg_data_type, &ins->declaration.semantic.reg);
532 components = *tokens++;
533 if ((components & 0xfff0) != (components & 0xf) * 0x1110)
534 FIXME("Components (%#x) have different data types.\n", components);
535 data_type = components & 0xf;
537 if (!data_type || (data_type >= ARRAY_SIZE(data_type_table)))
539 FIXME("Unhandled data type %#x.\n", data_type);
540 ins->declaration.semantic.resource_data_type = WINED3D_DATA_FLOAT;
542 else
544 ins->declaration.semantic.resource_data_type = data_type_table[data_type];
548 static void shader_sm4_read_dcl_constant_buffer(struct wined3d_shader_instruction *ins,
549 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
550 struct wined3d_sm4_data *priv)
552 shader_sm4_read_src_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.src);
553 if (opcode_token & WINED3D_SM4_INDEX_TYPE_MASK)
554 ins->flags |= WINED3DSI_INDEXED_DYNAMIC;
557 static void shader_sm4_read_dcl_sampler(struct wined3d_shader_instruction *ins,
558 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
559 struct wined3d_sm4_data *priv)
561 ins->flags = (opcode_token & WINED3D_SM4_SAMPLER_MODE_MASK) >> WINED3D_SM4_SAMPLER_MODE_SHIFT;
562 if (ins->flags & ~WINED3D_SM4_SAMPLER_COMPARISON)
563 FIXME("Unhandled sampler mode %#x.\n", ins->flags);
564 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_SAMPLER, &ins->declaration.dst);
567 static void shader_sm4_read_dcl_output_topology(struct wined3d_shader_instruction *ins,
568 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
569 struct wined3d_sm4_data *priv)
571 enum wined3d_sm4_output_primitive_type primitive_type;
573 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
574 if (primitive_type >= sizeof(output_primitive_type_table) / sizeof(*output_primitive_type_table))
576 FIXME("Unhandled output primitive type %#x.\n", primitive_type);
577 ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
579 else
581 ins->declaration.primitive_type = output_primitive_type_table[primitive_type];
585 static void shader_sm4_read_dcl_input_primitive(struct wined3d_shader_instruction *ins,
586 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
587 struct wined3d_sm4_data *priv)
589 enum wined3d_sm4_input_primitive_type primitive_type;
591 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
592 if (primitive_type >= sizeof(input_primitive_type_table) / sizeof(*input_primitive_type_table))
594 FIXME("Unhandled input primitive type %#x.\n", primitive_type);
595 ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
597 else
599 ins->declaration.primitive_type = input_primitive_type_table[primitive_type];
603 static void shader_sm4_read_declaration_count(struct wined3d_shader_instruction *ins,
604 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
605 struct wined3d_sm4_data *priv)
607 ins->declaration.count = *tokens;
610 static void shader_sm4_read_declaration_dst(struct wined3d_shader_instruction *ins,
611 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
612 struct wined3d_sm4_data *priv)
614 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.dst);
617 static void shader_sm4_read_declaration_register_semantic(struct wined3d_shader_instruction *ins,
618 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
619 struct wined3d_sm4_data *priv)
621 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.register_semantic.reg);
622 ins->declaration.register_semantic.sysval_semantic = *tokens;
625 static void shader_sm4_read_dcl_input_ps(struct wined3d_shader_instruction *ins,
626 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
627 struct wined3d_sm4_data *priv)
629 ins->flags = (opcode_token & WINED3D_SM4_INTERPOLATION_MODE_MASK) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT;
630 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.dst);
633 static void shader_sm4_read_dcl_input_ps_siv(struct wined3d_shader_instruction *ins,
634 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
635 struct wined3d_sm4_data *priv)
637 ins->flags = (opcode_token & WINED3D_SM4_INTERPOLATION_MODE_MASK) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT;
638 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.register_semantic.reg);
639 ins->declaration.register_semantic.sysval_semantic = *tokens;
642 static void shader_sm4_read_dcl_indexable_temp(struct wined3d_shader_instruction *ins,
643 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
644 struct wined3d_sm4_data *priv)
646 ins->declaration.indexable_temp.register_idx = *tokens++;
647 ins->declaration.indexable_temp.register_size = *tokens++;
648 ins->declaration.indexable_temp.component_count = *tokens;
651 static void shader_sm4_read_dcl_global_flags(struct wined3d_shader_instruction *ins,
652 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
653 struct wined3d_sm4_data *priv)
655 ins->flags = (opcode_token & WINED3D_SM4_GLOBAL_FLAGS_MASK) >> WINED3D_SM4_GLOBAL_FLAGS_SHIFT;
658 static void shader_sm5_read_fcall(struct wined3d_shader_instruction *ins,
659 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
660 struct wined3d_sm4_data *priv)
662 priv->src_param[0].reg.u.fp_body_idx = *tokens++;
663 shader_sm4_read_src_param(priv, &tokens, WINED3D_DATA_OPAQUE, &priv->src_param[0]);
666 static void shader_sm5_read_dcl_function_body(struct wined3d_shader_instruction *ins,
667 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
668 struct wined3d_sm4_data *priv)
670 ins->declaration.index = *tokens;
673 static void shader_sm5_read_dcl_function_table(struct wined3d_shader_instruction *ins,
674 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
675 struct wined3d_sm4_data *priv)
677 ins->declaration.index = *tokens++;
678 FIXME("Ignoring set of function bodies (count %u).\n", *tokens);
681 static void shader_sm5_read_dcl_interface(struct wined3d_shader_instruction *ins,
682 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
683 struct wined3d_sm4_data *priv)
685 ins->declaration.fp.index = *tokens++;
686 ins->declaration.fp.body_count = *tokens++;
687 ins->declaration.fp.array_size = *tokens >> WINED3D_SM5_FP_ARRAY_SIZE_SHIFT;
688 ins->declaration.fp.table_count = *tokens++ & WINED3D_SM5_FP_TABLE_COUNT_MASK;
689 FIXME("Ignoring set of function tables (count %u).\n", ins->declaration.fp.table_count);
692 static void shader_sm5_read_control_point_count(struct wined3d_shader_instruction *ins,
693 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
694 struct wined3d_sm4_data *priv)
696 ins->declaration.count = (opcode_token & WINED3D_SM5_CONTROL_POINT_COUNT_MASK)
697 >> WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT;
700 static void shader_sm5_read_dcl_tessellator_domain(struct wined3d_shader_instruction *ins,
701 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
702 struct wined3d_sm4_data *priv)
704 ins->declaration.tessellator_domain = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
705 >> WINED3D_SM5_TESSELLATOR_SHIFT;
708 static void shader_sm5_read_dcl_tessellator_partitioning(struct wined3d_shader_instruction *ins,
709 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
710 struct wined3d_sm4_data *priv)
712 ins->declaration.tessellator_partitioning = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
713 >> WINED3D_SM5_TESSELLATOR_SHIFT;
716 static void shader_sm5_read_dcl_tessellator_output_primitive(struct wined3d_shader_instruction *ins,
717 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
718 struct wined3d_sm4_data *priv)
720 ins->declaration.tessellator_output_primitive = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
721 >> WINED3D_SM5_TESSELLATOR_SHIFT;
724 static void shader_sm5_read_dcl_hs_max_tessfactor(struct wined3d_shader_instruction *ins,
725 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
726 struct wined3d_sm4_data *priv)
728 ins->declaration.max_tessellation_factor = *(float *)tokens;
731 static void shader_sm5_read_dcl_thread_group(struct wined3d_shader_instruction *ins,
732 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
733 struct wined3d_sm4_data *priv)
735 ins->declaration.thread_group_size.x = *tokens++;
736 ins->declaration.thread_group_size.y = *tokens++;
737 ins->declaration.thread_group_size.z = *tokens++;
740 static void shader_sm5_read_dcl_uav_raw(struct wined3d_shader_instruction *ins,
741 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
742 struct wined3d_sm4_data *priv)
744 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_UAV, &ins->declaration.dst);
745 ins->flags = (opcode_token & WINED3D_SM5_UAV_FLAGS_MASK) >> WINED3D_SM5_UAV_FLAGS_SHIFT;
748 static void shader_sm5_read_dcl_uav_structured(struct wined3d_shader_instruction *ins,
749 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
750 struct wined3d_sm4_data *priv)
752 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_UAV, &ins->declaration.structured_resource.reg);
753 ins->flags = (opcode_token & WINED3D_SM5_UAV_FLAGS_MASK) >> WINED3D_SM5_UAV_FLAGS_SHIFT;
754 ins->declaration.structured_resource.byte_stride = *tokens;
757 static void shader_sm5_read_dcl_tgsm_raw(struct wined3d_shader_instruction *ins,
758 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
759 struct wined3d_sm4_data *priv)
761 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.tgsm_raw.reg);
762 ins->declaration.tgsm_raw.byte_count = *tokens;
765 static void shader_sm5_read_dcl_tgsm_structured(struct wined3d_shader_instruction *ins,
766 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
767 struct wined3d_sm4_data *priv)
769 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_FLOAT, &ins->declaration.tgsm_structured.reg);
770 ins->declaration.tgsm_structured.byte_stride = *tokens++;
771 ins->declaration.tgsm_structured.structure_count = *tokens;
774 static void shader_sm5_read_dcl_resource_structured(struct wined3d_shader_instruction *ins,
775 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
776 struct wined3d_sm4_data *priv)
778 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_RESOURCE, &ins->declaration.structured_resource.reg);
779 ins->declaration.structured_resource.byte_stride = *tokens;
782 static void shader_sm5_read_dcl_resource_raw(struct wined3d_shader_instruction *ins,
783 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
784 struct wined3d_sm4_data *priv)
786 shader_sm4_read_dst_param(priv, &tokens, WINED3D_DATA_RESOURCE, &ins->declaration.dst);
789 static void shader_sm5_read_sync(struct wined3d_shader_instruction *ins,
790 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
791 struct wined3d_sm4_data *priv)
793 ins->flags = (opcode_token & WINED3D_SM5_SYNC_FLAGS_MASK) >> WINED3D_SM5_SYNC_FLAGS_SHIFT;
797 * f -> WINED3D_DATA_FLOAT
798 * i -> WINED3D_DATA_INT
799 * u -> WINED3D_DATA_UINT
800 * O -> WINED3D_DATA_OPAQUE
801 * R -> WINED3D_DATA_RESOURCE
802 * S -> WINED3D_DATA_SAMPLER
803 * U -> WINED3D_DATA_UAV
805 static const struct wined3d_sm4_opcode_info opcode_table[] =
807 {WINED3D_SM4_OP_ADD, WINED3DSIH_ADD, "f", "ff"},
808 {WINED3D_SM4_OP_AND, WINED3DSIH_AND, "u", "uu"},
809 {WINED3D_SM4_OP_BREAK, WINED3DSIH_BREAK, "", ""},
810 {WINED3D_SM4_OP_BREAKC, WINED3DSIH_BREAKP, "", "u",
811 shader_sm4_read_conditional_op},
812 {WINED3D_SM4_OP_CASE, WINED3DSIH_CASE, "", "u"},
813 {WINED3D_SM4_OP_CONTINUE, WINED3DSIH_CONTINUE, "", ""},
814 {WINED3D_SM4_OP_CUT, WINED3DSIH_CUT, "", ""},
815 {WINED3D_SM4_OP_DEFAULT, WINED3DSIH_DEFAULT, "", ""},
816 {WINED3D_SM4_OP_DERIV_RTX, WINED3DSIH_DSX, "f", "f"},
817 {WINED3D_SM4_OP_DERIV_RTY, WINED3DSIH_DSY, "f", "f"},
818 {WINED3D_SM4_OP_DISCARD, WINED3DSIH_TEXKILL, "", "u"},
819 {WINED3D_SM4_OP_DIV, WINED3DSIH_DIV, "f", "ff"},
820 {WINED3D_SM4_OP_DP2, WINED3DSIH_DP2, "f", "ff"},
821 {WINED3D_SM4_OP_DP3, WINED3DSIH_DP3, "f", "ff"},
822 {WINED3D_SM4_OP_DP4, WINED3DSIH_DP4, "f", "ff"},
823 {WINED3D_SM4_OP_ELSE, WINED3DSIH_ELSE, "", ""},
824 {WINED3D_SM4_OP_EMIT, WINED3DSIH_EMIT, "", ""},
825 {WINED3D_SM4_OP_ENDIF, WINED3DSIH_ENDIF, "", ""},
826 {WINED3D_SM4_OP_ENDLOOP, WINED3DSIH_ENDLOOP, "", ""},
827 {WINED3D_SM4_OP_ENDSWITCH, WINED3DSIH_ENDSWITCH, "", ""},
828 {WINED3D_SM4_OP_EQ, WINED3DSIH_EQ, "u", "ff"},
829 {WINED3D_SM4_OP_EXP, WINED3DSIH_EXP, "f", "f"},
830 {WINED3D_SM4_OP_FRC, WINED3DSIH_FRC, "f", "f"},
831 {WINED3D_SM4_OP_FTOI, WINED3DSIH_FTOI, "i", "f"},
832 {WINED3D_SM4_OP_FTOU, WINED3DSIH_FTOU, "u", "f"},
833 {WINED3D_SM4_OP_GE, WINED3DSIH_GE, "u", "ff"},
834 {WINED3D_SM4_OP_IADD, WINED3DSIH_IADD, "i", "ii"},
835 {WINED3D_SM4_OP_IF, WINED3DSIH_IF, "", "u",
836 shader_sm4_read_conditional_op},
837 {WINED3D_SM4_OP_IEQ, WINED3DSIH_IEQ, "u", "ii"},
838 {WINED3D_SM4_OP_IGE, WINED3DSIH_IGE, "u", "ii"},
839 {WINED3D_SM4_OP_ILT, WINED3DSIH_ILT, "u", "ii"},
840 {WINED3D_SM4_OP_IMAD, WINED3DSIH_IMAD, "i", "iii"},
841 {WINED3D_SM4_OP_IMAX, WINED3DSIH_IMAX, "i", "ii"},
842 {WINED3D_SM4_OP_IMIN, WINED3DSIH_IMIN, "i", "ii"},
843 {WINED3D_SM4_OP_IMUL, WINED3DSIH_IMUL, "ii", "ii"},
844 {WINED3D_SM4_OP_INE, WINED3DSIH_INE, "u", "ii"},
845 {WINED3D_SM4_OP_INEG, WINED3DSIH_INEG, "i", "i"},
846 {WINED3D_SM4_OP_ISHL, WINED3DSIH_ISHL, "i", "ii"},
847 {WINED3D_SM4_OP_ISHR, WINED3DSIH_ISHR, "i", "ii"},
848 {WINED3D_SM4_OP_ITOF, WINED3DSIH_ITOF, "f", "i"},
849 {WINED3D_SM4_OP_LABEL, WINED3DSIH_LABEL, "", "O"},
850 {WINED3D_SM4_OP_LD, WINED3DSIH_LD, "u", "iR"},
851 {WINED3D_SM4_OP_LD2DMS, WINED3DSIH_LD2DMS, "u", "iRi"},
852 {WINED3D_SM4_OP_LOG, WINED3DSIH_LOG, "f", "f"},
853 {WINED3D_SM4_OP_LOOP, WINED3DSIH_LOOP, "", ""},
854 {WINED3D_SM4_OP_LT, WINED3DSIH_LT, "u", "ff"},
855 {WINED3D_SM4_OP_MAD, WINED3DSIH_MAD, "f", "fff"},
856 {WINED3D_SM4_OP_MIN, WINED3DSIH_MIN, "f", "ff"},
857 {WINED3D_SM4_OP_MAX, WINED3DSIH_MAX, "f", "ff"},
858 {WINED3D_SM4_OP_SHADER_DATA, WINED3DSIH_DCL_IMMEDIATE_CONSTANT_BUFFER, "", "",
859 shader_sm4_read_shader_data},
860 {WINED3D_SM4_OP_MOV, WINED3DSIH_MOV, "f", "f"},
861 {WINED3D_SM4_OP_MOVC, WINED3DSIH_MOVC, "f", "uff"},
862 {WINED3D_SM4_OP_MUL, WINED3DSIH_MUL, "f", "ff"},
863 {WINED3D_SM4_OP_NE, WINED3DSIH_NE, "u", "ff"},
864 {WINED3D_SM4_OP_NOT, WINED3DSIH_NOT, "u", "u"},
865 {WINED3D_SM4_OP_OR, WINED3DSIH_OR, "u", "uu"},
866 {WINED3D_SM4_OP_RESINFO, WINED3DSIH_RESINFO, "f", "iR"},
867 {WINED3D_SM4_OP_RET, WINED3DSIH_RET, "", ""},
868 {WINED3D_SM4_OP_ROUND_NE, WINED3DSIH_ROUND_NE, "f", "f"},
869 {WINED3D_SM4_OP_ROUND_NI, WINED3DSIH_ROUND_NI, "f", "f"},
870 {WINED3D_SM4_OP_ROUND_PI, WINED3DSIH_ROUND_PI, "f", "f"},
871 {WINED3D_SM4_OP_ROUND_Z, WINED3DSIH_ROUND_Z, "f", "f"},
872 {WINED3D_SM4_OP_RSQ, WINED3DSIH_RSQ, "f", "f"},
873 {WINED3D_SM4_OP_SAMPLE, WINED3DSIH_SAMPLE, "u", "fRS"},
874 {WINED3D_SM4_OP_SAMPLE_C, WINED3DSIH_SAMPLE_C, "f", "fRSf"},
875 {WINED3D_SM4_OP_SAMPLE_C_LZ, WINED3DSIH_SAMPLE_C_LZ, "f", "fRSf"},
876 {WINED3D_SM4_OP_SAMPLE_LOD, WINED3DSIH_SAMPLE_LOD, "u", "fRSf"},
877 {WINED3D_SM4_OP_SAMPLE_GRAD, WINED3DSIH_SAMPLE_GRAD, "u", "fRSff"},
878 {WINED3D_SM4_OP_SAMPLE_B, WINED3DSIH_SAMPLE_B, "u", "fRSf"},
879 {WINED3D_SM4_OP_SQRT, WINED3DSIH_SQRT, "f", "f"},
880 {WINED3D_SM4_OP_SWITCH, WINED3DSIH_SWITCH, "", "u"},
881 {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS, "ff", "f"},
882 {WINED3D_SM4_OP_UDIV, WINED3DSIH_UDIV, "uu", "uu"},
883 {WINED3D_SM4_OP_ULT, WINED3DSIH_ULT, "u", "uu"},
884 {WINED3D_SM4_OP_UGE, WINED3DSIH_UGE, "u", "uu"},
885 {WINED3D_SM4_OP_UMAX, WINED3DSIH_UMAX, "u", "uu"},
886 {WINED3D_SM4_OP_UMIN, WINED3DSIH_UMIN, "u", "uu"},
887 {WINED3D_SM4_OP_USHR, WINED3DSIH_USHR, "u", "uu"},
888 {WINED3D_SM4_OP_UTOF, WINED3DSIH_UTOF, "f", "u"},
889 {WINED3D_SM4_OP_XOR, WINED3DSIH_XOR, "u", "uu"},
890 {WINED3D_SM4_OP_DCL_RESOURCE, WINED3DSIH_DCL, "R", "",
891 shader_sm4_read_dcl_resource},
892 {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER, WINED3DSIH_DCL_CONSTANT_BUFFER, "", "",
893 shader_sm4_read_dcl_constant_buffer},
894 {WINED3D_SM4_OP_DCL_SAMPLER, WINED3DSIH_DCL_SAMPLER, "", "",
895 shader_sm4_read_dcl_sampler},
896 {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY, WINED3DSIH_DCL_OUTPUT_TOPOLOGY, "", "",
897 shader_sm4_read_dcl_output_topology},
898 {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE, WINED3DSIH_DCL_INPUT_PRIMITIVE, "", "",
899 shader_sm4_read_dcl_input_primitive},
900 {WINED3D_SM4_OP_DCL_VERTICES_OUT, WINED3DSIH_DCL_VERTICES_OUT, "", "",
901 shader_sm4_read_declaration_count},
902 {WINED3D_SM4_OP_DCL_INPUT, WINED3DSIH_DCL_INPUT, "", "",
903 shader_sm4_read_declaration_dst},
904 {WINED3D_SM4_OP_DCL_INPUT_SGV, WINED3DSIH_DCL_INPUT_SGV, "", "",
905 shader_sm4_read_declaration_register_semantic},
906 {WINED3D_SM4_OP_DCL_INPUT_SIV, WINED3DSIH_DCL_INPUT_SIV, "", "",
907 shader_sm4_read_declaration_register_semantic},
908 {WINED3D_SM4_OP_DCL_INPUT_PS, WINED3DSIH_DCL_INPUT_PS, "", "",
909 shader_sm4_read_dcl_input_ps},
910 {WINED3D_SM4_OP_DCL_INPUT_PS_SGV, WINED3DSIH_DCL_INPUT_PS_SGV, "", "",
911 shader_sm4_read_declaration_register_semantic},
912 {WINED3D_SM4_OP_DCL_INPUT_PS_SIV, WINED3DSIH_DCL_INPUT_PS_SIV, "", "",
913 shader_sm4_read_dcl_input_ps_siv},
914 {WINED3D_SM4_OP_DCL_OUTPUT, WINED3DSIH_DCL_OUTPUT, "", "",
915 shader_sm4_read_declaration_dst},
916 {WINED3D_SM4_OP_DCL_OUTPUT_SIV, WINED3DSIH_DCL_OUTPUT_SIV, "", "",
917 shader_sm4_read_declaration_register_semantic},
918 {WINED3D_SM4_OP_DCL_TEMPS, WINED3DSIH_DCL_TEMPS, "", "",
919 shader_sm4_read_declaration_count},
920 {WINED3D_SM4_OP_DCL_INDEXABLE_TEMP, WINED3DSIH_DCL_INDEXABLE_TEMP, "", "",
921 shader_sm4_read_dcl_indexable_temp},
922 {WINED3D_SM4_OP_DCL_GLOBAL_FLAGS, WINED3DSIH_DCL_GLOBAL_FLAGS, "", "",
923 shader_sm4_read_dcl_global_flags},
924 {WINED3D_SM4_OP_LOD, WINED3DSIH_LOD, "f", "fRS"},
925 {WINED3D_SM4_OP_GATHER4, WINED3DSIH_GATHER4, "u", "fRS"},
926 {WINED3D_SM4_OP_SAMPLE_POS, WINED3DSIH_SAMPLE_POS, "f", "Ru"},
927 {WINED3D_SM4_OP_SAMPLE_INFO, WINED3DSIH_SAMPLE_INFO, "f", "R"},
928 {WINED3D_SM5_OP_HS_DECLS, WINED3DSIH_HS_DECLS, "", ""},
929 {WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE, WINED3DSIH_HS_CONTROL_POINT_PHASE, "", ""},
930 {WINED3D_SM5_OP_HS_FORK_PHASE, WINED3DSIH_HS_FORK_PHASE, "", ""},
931 {WINED3D_SM5_OP_HS_JOIN_PHASE, WINED3DSIH_HS_JOIN_PHASE, "", ""},
932 {WINED3D_SM5_OP_EMIT_STREAM, WINED3DSIH_EMIT_STREAM, "", "f"},
933 {WINED3D_SM5_OP_CUT_STREAM, WINED3DSIH_CUT_STREAM, "", "f"},
934 {WINED3D_SM5_OP_FCALL, WINED3DSIH_FCALL, "", "O",
935 shader_sm5_read_fcall},
936 {WINED3D_SM5_OP_BUFINFO, WINED3DSIH_BUFINFO, "i", "U"},
937 {WINED3D_SM5_OP_DERIV_RTX_COARSE, WINED3DSIH_DSX_COARSE, "f", "f"},
938 {WINED3D_SM5_OP_DERIV_RTX_FINE, WINED3DSIH_DSX_FINE, "f", "f"},
939 {WINED3D_SM5_OP_DERIV_RTY_COARSE, WINED3DSIH_DSY_COARSE, "f", "f"},
940 {WINED3D_SM5_OP_DERIV_RTY_FINE, WINED3DSIH_DSY_FINE, "f", "f"},
941 {WINED3D_SM5_OP_GATHER4_C, WINED3DSIH_GATHER4_C, "f", "fRSf"},
942 {WINED3D_SM5_OP_RCP, WINED3DSIH_RCP, "f", "f"},
943 {WINED3D_SM5_OP_F32TOF16, WINED3DSIH_F32TOF16, "u", "f"},
944 {WINED3D_SM5_OP_F16TOF32, WINED3DSIH_F16TOF32, "f", "u"},
945 {WINED3D_SM5_OP_COUNTBITS, WINED3DSIH_COUNTBITS, "u", "u"},
946 {WINED3D_SM5_OP_FIRSTBIT_HI, WINED3DSIH_FIRSTBIT_HI, "u", "u"},
947 {WINED3D_SM5_OP_FIRSTBIT_LO, WINED3DSIH_FIRSTBIT_LO, "u", "u"},
948 {WINED3D_SM5_OP_FIRSTBIT_SHI, WINED3DSIH_FIRSTBIT_SHI, "u", "i"},
949 {WINED3D_SM5_OP_UBFE, WINED3DSIH_UBFE, "u", "iiu"},
950 {WINED3D_SM5_OP_BFI, WINED3DSIH_BFI, "u", "iiuu"},
951 {WINED3D_SM5_OP_BFREV, WINED3DSIH_BFREV, "u", "u"},
952 {WINED3D_SM5_OP_SWAPC, WINED3DSIH_SWAPC, "ff", "uff"},
953 {WINED3D_SM5_OP_DCL_STREAM, WINED3DSIH_DCL_STREAM, "", "O"},
954 {WINED3D_SM5_OP_DCL_FUNCTION_BODY, WINED3DSIH_DCL_FUNCTION_BODY, "", "",
955 shader_sm5_read_dcl_function_body},
956 {WINED3D_SM5_OP_DCL_FUNCTION_TABLE, WINED3DSIH_DCL_FUNCTION_TABLE, "", "",
957 shader_sm5_read_dcl_function_table},
958 {WINED3D_SM5_OP_DCL_INTERFACE, WINED3DSIH_DCL_INTERFACE, "", "",
959 shader_sm5_read_dcl_interface},
960 {WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT, WINED3DSIH_DCL_INPUT_CONTROL_POINT_COUNT, "", "",
961 shader_sm5_read_control_point_count},
962 {WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT, WINED3DSIH_DCL_OUTPUT_CONTROL_POINT_COUNT, "", "",
963 shader_sm5_read_control_point_count},
964 {WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN, WINED3DSIH_DCL_TESSELLATOR_DOMAIN, "", "",
965 shader_sm5_read_dcl_tessellator_domain},
966 {WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING, WINED3DSIH_DCL_TESSELLATOR_PARTITIONING, "", "",
967 shader_sm5_read_dcl_tessellator_partitioning},
968 {WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, WINED3DSIH_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, "", "",
969 shader_sm5_read_dcl_tessellator_output_primitive},
970 {WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR, WINED3DSIH_DCL_HS_MAX_TESSFACTOR, "", "",
971 shader_sm5_read_dcl_hs_max_tessfactor},
972 {WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT, WINED3DSIH_DCL_HS_FORK_PHASE_INSTANCE_COUNT, "", "",
973 shader_sm4_read_declaration_count},
974 {WINED3D_SM5_OP_DCL_THREAD_GROUP, WINED3DSIH_DCL_THREAD_GROUP, "", "",
975 shader_sm5_read_dcl_thread_group},
976 {WINED3D_SM5_OP_DCL_UAV_TYPED, WINED3DSIH_DCL_UAV_TYPED, "", "",
977 shader_sm4_read_dcl_resource},
978 {WINED3D_SM5_OP_DCL_UAV_RAW, WINED3DSIH_DCL_UAV_RAW, "", "",
979 shader_sm5_read_dcl_uav_raw},
980 {WINED3D_SM5_OP_DCL_UAV_STRUCTURED, WINED3DSIH_DCL_UAV_STRUCTURED, "", "",
981 shader_sm5_read_dcl_uav_structured},
982 {WINED3D_SM5_OP_DCL_TGSM_RAW, WINED3DSIH_DCL_TGSM_RAW, "", "",
983 shader_sm5_read_dcl_tgsm_raw},
984 {WINED3D_SM5_OP_DCL_TGSM_STRUCTURED, WINED3DSIH_DCL_TGSM_STRUCTURED, "", "",
985 shader_sm5_read_dcl_tgsm_structured},
986 {WINED3D_SM5_OP_DCL_RESOURCE_RAW, WINED3DSIH_DCL_RESOURCE_RAW, "", "",
987 shader_sm5_read_dcl_resource_raw},
988 {WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED, WINED3DSIH_DCL_RESOURCE_STRUCTURED, "", "",
989 shader_sm5_read_dcl_resource_structured},
990 {WINED3D_SM5_OP_LD_UAV_TYPED, WINED3DSIH_LD_UAV_TYPED, "u", "iU"},
991 {WINED3D_SM5_OP_STORE_UAV_TYPED, WINED3DSIH_STORE_UAV_TYPED, "U", "iu"},
992 {WINED3D_SM5_OP_LD_RAW, WINED3DSIH_LD_RAW, "u", "iU"},
993 {WINED3D_SM5_OP_STORE_RAW, WINED3DSIH_STORE_RAW, "U", "iu"},
994 {WINED3D_SM5_OP_LD_STRUCTURED, WINED3DSIH_LD_STRUCTURED, "u", "iiR"},
995 {WINED3D_SM5_OP_STORE_STRUCTURED, WINED3DSIH_STORE_STRUCTURED, "U", "iiu"},
996 {WINED3D_SM5_OP_ATOMIC_AND, WINED3DSIH_ATOMIC_AND, "U", "iu"},
997 {WINED3D_SM5_OP_ATOMIC_OR, WINED3DSIH_ATOMIC_OR, "U", "iu"},
998 {WINED3D_SM5_OP_ATOMIC_XOR, WINED3DSIH_ATOMIC_XOR, "U", "iu"},
999 {WINED3D_SM5_OP_ATOMIC_CMP_STORE, WINED3DSIH_ATOMIC_CMP_STORE, "U", "iuu"},
1000 {WINED3D_SM5_OP_ATOMIC_IADD, WINED3DSIH_ATOMIC_IADD, "U", "ii"},
1001 {WINED3D_SM5_OP_ATOMIC_IMAX, WINED3DSIH_ATOMIC_IMAX, "U", "ii"},
1002 {WINED3D_SM5_OP_ATOMIC_IMIN, WINED3DSIH_ATOMIC_IMIN, "U", "ii"},
1003 {WINED3D_SM5_OP_ATOMIC_UMAX, WINED3DSIH_ATOMIC_UMAX, "U", "iu"},
1004 {WINED3D_SM5_OP_ATOMIC_UMIN, WINED3DSIH_ATOMIC_UMIN, "U", "iu"},
1005 {WINED3D_SM5_OP_IMM_ATOMIC_ALLOC, WINED3DSIH_IMM_ATOMIC_ALLOC, "u", "U"},
1006 {WINED3D_SM5_OP_IMM_ATOMIC_CONSUME, WINED3DSIH_IMM_ATOMIC_CONSUME, "u", "U"},
1007 {WINED3D_SM5_OP_IMM_ATOMIC_IADD, WINED3DSIH_IMM_ATOMIC_IADD, "uU", "ii"},
1008 {WINED3D_SM5_OP_IMM_ATOMIC_AND, WINED3DSIH_IMM_ATOMIC_AND, "uU", "iu"},
1009 {WINED3D_SM5_OP_IMM_ATOMIC_OR, WINED3DSIH_IMM_ATOMIC_OR, "uU", "iu"},
1010 {WINED3D_SM5_OP_IMM_ATOMIC_XOR, WINED3DSIH_IMM_ATOMIC_XOR, "uU", "iu"},
1011 {WINED3D_SM5_OP_IMM_ATOMIC_EXCH, WINED3DSIH_IMM_ATOMIC_EXCH, "uU", "iu"},
1012 {WINED3D_SM5_OP_IMM_ATOMIC_CMP_EXCH, WINED3DSIH_IMM_ATOMIC_CMP_EXCH, "uU", "iuu"},
1013 {WINED3D_SM5_OP_IMM_ATOMIC_IMAX, WINED3DSIH_IMM_ATOMIC_IMAX, "iU", "ii"},
1014 {WINED3D_SM5_OP_IMM_ATOMIC_UMAX, WINED3DSIH_IMM_ATOMIC_UMAX, "uU", "iu"},
1015 {WINED3D_SM5_OP_IMM_ATOMIC_UMIN, WINED3DSIH_IMM_ATOMIC_UMIN, "uU", "iu"},
1016 {WINED3D_SM5_OP_SYNC, WINED3DSIH_SYNC, "", "",
1017 shader_sm5_read_sync},
1020 static const enum wined3d_shader_register_type register_type_table[] =
1022 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP,
1023 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT,
1024 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT,
1025 /* WINED3D_SM4_RT_INDEXABLE_TEMP */ WINED3DSPR_IDXTEMP,
1026 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST,
1027 /* UNKNOWN */ ~0u,
1028 /* WINED3D_SM4_RT_SAMPLER */ WINED3DSPR_SAMPLER,
1029 /* WINED3D_SM4_RT_RESOURCE */ WINED3DSPR_RESOURCE,
1030 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER,
1031 /* WINED3D_SM4_RT_IMMCONSTBUFFER */ WINED3DSPR_IMMCONSTBUFFER,
1032 /* UNKNOWN */ ~0u,
1033 /* WINED3D_SM4_RT_PRIMID */ WINED3DSPR_PRIMID,
1034 /* WINED3D_SM4_RT_DEPTHOUT */ WINED3DSPR_DEPTHOUT,
1035 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL,
1036 /* UNKNOWN */ ~0u,
1037 /* WINED3D_SM4_RT_OMASK */ WINED3DSPR_SAMPLEMASK,
1038 /* WINED3D_SM5_RT_STREAM */ WINED3DSPR_STREAM,
1039 /* WINED3D_SM5_RT_FUNCTION_BODY */ WINED3DSPR_FUNCTIONBODY,
1040 /* UNKNOWN */ ~0u,
1041 /* WINED3D_SM5_RT_FUNCTION_POINTER */ WINED3DSPR_FUNCTIONPOINTER,
1042 /* UNKNOWN */ ~0u,
1043 /* UNKNOWN */ ~0u,
1044 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID */ WINED3DSPR_OUTPOINTID,
1045 /* WINED3D_SM5_RT_FORK_INSTANCE_ID */ WINED3DSPR_FORKINSTID,
1046 /* UNKNOWN */ ~0u,
1047 /* WINED3D_SM5_RT_INPUT_CONTROL_POINT */ WINED3DSPR_INCONTROLPOINT,
1048 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT */ WINED3DSPR_OUTCONTROLPOINT,
1049 /* WINED3D_SM5_RT_PATCH_CONSTANT_DATA */ WINED3DSPR_PATCHCONST,
1050 /* WINED3D_SM5_RT_DOMAIN_LOCATION */ WINED3DSPR_TESSCOORD,
1051 /* UNKNOWN */ ~0u,
1052 /* WINED3D_SM5_RT_UAV */ WINED3DSPR_UAV,
1053 /* WINED3D_SM5_RT_SHARED_MEMORY */ WINED3DSPR_GROUPSHAREDMEM,
1054 /* WINED3D_SM5_RT_THREAD_ID */ WINED3DSPR_THREADID,
1055 /* WINED3D_SM5_RT_THREAD_GROUP_ID */ WINED3DSPR_THREADGROUPID,
1056 /* WINED3D_SM5_RT_LOCAL_THREAD_ID */ WINED3DSPR_LOCALTHREADID,
1057 /* WINED3D_SM5_RT_COVERAGE */ WINED3DSPR_COVERAGE,
1058 /* WINED3D_SM5_RT_LOCAL_THREAD_INDEX */ WINED3DSPR_LOCALTHREADINDEX,
1061 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
1063 unsigned int i;
1065 for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
1067 if (opcode == opcode_table[i].opcode) return &opcode_table[i];
1070 return NULL;
1073 static void map_register(const struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
1075 switch (priv->shader_version.type)
1077 case WINED3D_SHADER_TYPE_PIXEL:
1078 if (reg->type == WINED3DSPR_OUTPUT)
1080 unsigned int reg_idx = reg->idx[0].offset;
1082 if (reg_idx >= ARRAY_SIZE(priv->output_map))
1084 ERR("Invalid output index %u.\n", reg_idx);
1085 break;
1088 reg->type = WINED3DSPR_COLOROUT;
1089 reg->idx[0].offset = priv->output_map[reg_idx];
1091 break;
1093 default:
1094 break;
1098 static enum wined3d_data_type map_data_type(char t)
1100 switch (t)
1102 case 'f':
1103 return WINED3D_DATA_FLOAT;
1104 case 'i':
1105 return WINED3D_DATA_INT;
1106 case 'u':
1107 return WINED3D_DATA_UINT;
1108 case 'O':
1109 return WINED3D_DATA_OPAQUE;
1110 case 'R':
1111 return WINED3D_DATA_RESOURCE;
1112 case 'S':
1113 return WINED3D_DATA_SAMPLER;
1114 case 'U':
1115 return WINED3D_DATA_UAV;
1116 default:
1117 ERR("Invalid data type '%c'.\n", t);
1118 return WINED3D_DATA_FLOAT;
1122 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
1124 struct wined3d_sm4_data *priv;
1125 unsigned int i;
1127 if (!(priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv))))
1129 ERR("Failed to allocate private data\n");
1130 return NULL;
1133 memset(priv->output_map, 0xff, sizeof(priv->output_map));
1134 for (i = 0; i < output_signature->element_count; ++i)
1136 struct wined3d_shader_signature_element *e = &output_signature->elements[i];
1138 if (e->register_idx >= ARRAY_SIZE(priv->output_map))
1140 WARN("Invalid output index %u.\n", e->register_idx);
1141 continue;
1144 priv->output_map[e->register_idx] = e->semantic_idx;
1147 list_init(&priv->src_free);
1148 list_init(&priv->src);
1150 return priv;
1153 static void shader_sm4_free(void *data)
1155 struct wined3d_shader_src_param_entry *e1, *e2;
1156 struct wined3d_sm4_data *priv = data;
1158 list_move_head(&priv->src_free, &priv->src);
1159 LIST_FOR_EACH_ENTRY_SAFE(e1, e2, &priv->src_free, struct wined3d_shader_src_param_entry, entry)
1161 HeapFree(GetProcessHeap(), 0, e1);
1163 HeapFree(GetProcessHeap(), 0, priv);
1166 static struct wined3d_shader_src_param *get_src_param(struct wined3d_sm4_data *priv)
1168 struct wined3d_shader_src_param_entry *e;
1169 struct list *elem;
1171 if (!list_empty(&priv->src_free))
1173 elem = list_head(&priv->src_free);
1174 list_remove(elem);
1176 else
1178 if (!(e = HeapAlloc(GetProcessHeap(), 0, sizeof(*e))))
1179 return NULL;
1180 elem = &e->entry;
1183 list_add_tail(&priv->src, elem);
1184 e = LIST_ENTRY(elem, struct wined3d_shader_src_param_entry, entry);
1185 return &e->param;
1188 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
1190 struct wined3d_sm4_data *priv = data;
1191 DWORD version_token;
1193 priv->end = *ptr;
1195 version_token = *(*ptr)++;
1196 TRACE("Version: 0x%08x.\n", version_token);
1198 TRACE("Token count: %u.\n", **ptr);
1199 priv->end += *(*ptr)++;
1201 switch (version_token >> 16)
1203 case WINED3D_SM4_PS:
1204 priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
1205 break;
1207 case WINED3D_SM4_VS:
1208 priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
1209 break;
1211 case WINED3D_SM4_GS:
1212 priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
1213 break;
1215 case WINED3D_SM5_HS:
1216 priv->shader_version.type = WINED3D_SHADER_TYPE_HULL;
1217 break;
1219 case WINED3D_SM5_DS:
1220 priv->shader_version.type = WINED3D_SHADER_TYPE_DOMAIN;
1221 break;
1223 case WINED3D_SM5_CS:
1224 priv->shader_version.type = WINED3D_SHADER_TYPE_COMPUTE;
1225 break;
1227 default:
1228 FIXME("Unrecognized shader type %#x.\n", version_token >> 16);
1230 priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
1231 priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
1233 *shader_version = priv->shader_version;
1236 static BOOL shader_sm4_read_reg_idx(struct wined3d_sm4_data *priv, const DWORD **ptr,
1237 DWORD addressing, struct wined3d_shader_register_index *reg_idx)
1239 if (addressing & WINED3D_SM4_ADDRESSING_RELATIVE)
1241 struct wined3d_shader_src_param *rel_addr = get_src_param(priv);
1243 if (!(reg_idx->rel_addr = rel_addr))
1245 ERR("Failed to get src param for relative addressing.\n");
1246 return FALSE;
1249 if (addressing & WINED3D_SM4_ADDRESSING_OFFSET)
1250 reg_idx->offset = *(*ptr)++;
1251 else
1252 reg_idx->offset = 0;
1253 shader_sm4_read_src_param(priv, ptr, WINED3D_DATA_INT, rel_addr);
1255 else
1257 reg_idx->rel_addr = NULL;
1258 reg_idx->offset = *(*ptr)++;
1261 return TRUE;
1264 static BOOL shader_sm4_read_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
1265 enum wined3d_data_type data_type, struct wined3d_shader_register *param,
1266 enum wined3d_shader_src_modifier *modifier)
1268 enum wined3d_sm4_register_type register_type;
1269 DWORD token = *(*ptr)++;
1270 DWORD order;
1272 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
1273 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table)
1274 || register_type_table[register_type] == ~0u)
1276 FIXME("Unhandled register type %#x.\n", register_type);
1277 param->type = WINED3DSPR_TEMP;
1279 else
1281 param->type = register_type_table[register_type];
1283 param->data_type = data_type;
1285 if (token & WINED3D_SM4_REGISTER_MODIFIER)
1287 DWORD m = *(*ptr)++;
1289 switch (m)
1291 case 0x41:
1292 *modifier = WINED3DSPSM_NEG;
1293 break;
1295 case 0x81:
1296 *modifier = WINED3DSPSM_ABS;
1297 break;
1299 case 0xc1:
1300 *modifier = WINED3DSPSM_ABSNEG;
1301 break;
1303 default:
1304 FIXME("Skipping modifier 0x%08x.\n", m);
1305 *modifier = WINED3DSPSM_NONE;
1306 break;
1309 else
1311 *modifier = WINED3DSPSM_NONE;
1314 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
1316 if (order < 1)
1317 param->idx[0].offset = ~0U;
1318 else
1320 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK0) >> WINED3D_SM4_ADDRESSING_SHIFT0;
1321 if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[0])))
1323 ERR("Failed to read register index.\n");
1324 return FALSE;
1328 if (order < 2)
1329 param->idx[1].offset = ~0U;
1330 else
1332 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK1) >> WINED3D_SM4_ADDRESSING_SHIFT1;
1333 if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[1])))
1335 ERR("Failed to read register index.\n");
1336 return FALSE;
1340 if (order > 2)
1341 FIXME("Unhandled order %u.\n", order);
1343 if (register_type == WINED3D_SM4_RT_IMMCONST)
1345 enum wined3d_sm4_immconst_type immconst_type =
1346 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
1348 switch (immconst_type)
1350 case WINED3D_SM4_IMMCONST_SCALAR:
1351 param->immconst_type = WINED3D_IMMCONST_SCALAR;
1352 memcpy(param->u.immconst_data, *ptr, 1 * sizeof(DWORD));
1353 *ptr += 1;
1354 break;
1356 case WINED3D_SM4_IMMCONST_VEC4:
1357 param->immconst_type = WINED3D_IMMCONST_VEC4;
1358 memcpy(param->u.immconst_data, *ptr, 4 * sizeof(DWORD));
1359 *ptr += 4;
1360 break;
1362 default:
1363 FIXME("Unhandled immediate constant type %#x.\n", immconst_type);
1364 break;
1368 map_register(priv, param);
1370 return TRUE;
1373 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
1374 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param)
1376 DWORD token = **ptr;
1378 if (!shader_sm4_read_param(priv, ptr, data_type, &src_param->reg, &src_param->modifiers))
1380 ERR("Failed to read parameter.\n");
1381 return FALSE;
1384 if (src_param->reg.type == WINED3DSPR_IMMCONST)
1386 src_param->swizzle = WINED3DSP_NOSWIZZLE;
1388 else
1390 enum wined3d_sm4_swizzle_type swizzle_type =
1391 (token & WINED3D_SM4_SWIZZLE_TYPE_MASK) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT;
1393 switch (swizzle_type)
1395 case WINED3D_SM4_SWIZZLE_NONE:
1396 src_param->swizzle = WINED3DSP_NOSWIZZLE;
1397 break;
1399 case WINED3D_SM4_SWIZZLE_SCALAR:
1400 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
1401 src_param->swizzle = (src_param->swizzle & 0x3) * 0x55;
1402 break;
1404 case WINED3D_SM4_SWIZZLE_VEC4:
1405 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
1406 break;
1408 default:
1409 FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
1410 break;
1414 return TRUE;
1417 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
1418 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param)
1420 enum wined3d_shader_src_modifier modifier;
1421 DWORD token = **ptr;
1423 if (!shader_sm4_read_param(priv, ptr, data_type, &dst_param->reg, &modifier))
1425 ERR("Failed to read parameter.\n");
1426 return FALSE;
1429 if (modifier != WINED3DSPSM_NONE)
1431 ERR("Invalid source modifier %#x on destination register.\n", modifier);
1432 return FALSE;
1435 dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
1436 dst_param->modifiers = 0;
1437 dst_param->shift = 0;
1439 return TRUE;
1442 static void shader_sm4_read_instruction_modifier(DWORD modifier, struct wined3d_shader_instruction *ins)
1444 static const DWORD recognized_bits = WINED3D_SM4_INSTRUCTION_MODIFIER
1445 | WINED3D_SM4_MODIFIER_AOFFIMMI
1446 | WINED3D_SM4_AOFFIMMI_U_MASK
1447 | WINED3D_SM4_AOFFIMMI_V_MASK
1448 | WINED3D_SM4_AOFFIMMI_W_MASK;
1450 if (modifier & ~recognized_bits)
1452 FIXME("Unhandled modifier 0x%08x.\n", modifier);
1454 else
1456 /* Bit fields are used for sign extension */
1457 struct
1459 int u : 4;
1460 int v : 4;
1461 int w : 4;
1463 aoffimmi;
1464 aoffimmi.u = (modifier & WINED3D_SM4_AOFFIMMI_U_MASK) >> WINED3D_SM4_AOFFIMMI_U_SHIFT;
1465 aoffimmi.v = (modifier & WINED3D_SM4_AOFFIMMI_V_MASK) >> WINED3D_SM4_AOFFIMMI_V_SHIFT;
1466 aoffimmi.w = (modifier & WINED3D_SM4_AOFFIMMI_W_MASK) >> WINED3D_SM4_AOFFIMMI_W_SHIFT;
1467 ins->texel_offset.u = aoffimmi.u;
1468 ins->texel_offset.v = aoffimmi.v;
1469 ins->texel_offset.w = aoffimmi.w;
1473 static void shader_sm4_read_instruction(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins)
1475 const struct wined3d_sm4_opcode_info *opcode_info;
1476 DWORD opcode_token, opcode, previous_token;
1477 struct wined3d_sm4_data *priv = data;
1478 unsigned int i, len;
1479 const DWORD *p;
1481 list_move_head(&priv->src_free, &priv->src);
1483 opcode_token = *(*ptr)++;
1484 opcode = opcode_token & WINED3D_SM4_OPCODE_MASK;
1486 len = ((opcode_token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT);
1487 if (!len)
1488 len = **ptr;
1489 --len;
1491 if (TRACE_ON(d3d_bytecode))
1493 TRACE_(d3d_bytecode)("[ %08x ", opcode_token);
1494 for (i = 0; i < len; ++i)
1496 TRACE_(d3d_bytecode)("%08x ", (*ptr)[i]);
1498 TRACE_(d3d_bytecode)("]\n");
1501 if (!(opcode_info = get_opcode_info(opcode)))
1503 FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode, opcode_token);
1504 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1505 *ptr += len;
1506 return;
1509 ins->handler_idx = opcode_info->handler_idx;
1510 ins->flags = 0;
1511 ins->coissue = 0;
1512 ins->predicate = NULL;
1513 ins->dst_count = strlen(opcode_info->dst_info);
1514 ins->dst = priv->dst_param;
1515 ins->src_count = strlen(opcode_info->src_info);
1516 ins->src = priv->src_param;
1517 memset(&ins->texel_offset, 0, sizeof(ins->texel_offset));
1519 p = *ptr;
1520 *ptr += len;
1522 previous_token = opcode_token;
1523 while (previous_token & WINED3D_SM4_INSTRUCTION_MODIFIER)
1524 shader_sm4_read_instruction_modifier(previous_token = *p++, ins);
1526 if (opcode_info->read_opcode_func)
1528 opcode_info->read_opcode_func(ins, opcode, opcode_token, p, len, priv);
1530 else
1532 enum wined3d_shader_dst_modifier instruction_dst_modifier = WINED3DSPDM_NONE;
1534 ins->flags = (opcode_token & WINED3D_SM4_INSTRUCTION_FLAGS_MASK) >> WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT;
1536 if (ins->flags & WINED3D_SM4_INSTRUCTION_FLAG_SATURATE)
1538 ins->flags &= ~WINED3D_SM4_INSTRUCTION_FLAG_SATURATE;
1539 instruction_dst_modifier = WINED3DSPDM_SATURATE;
1542 for (i = 0; i < ins->dst_count; ++i)
1544 if (!(shader_sm4_read_dst_param(priv, &p, map_data_type(opcode_info->dst_info[i]), &priv->dst_param[i])))
1546 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1547 return;
1549 priv->dst_param[i].modifiers |= instruction_dst_modifier;
1552 for (i = 0; i < ins->src_count; ++i)
1554 if (!(shader_sm4_read_src_param(priv, &p, map_data_type(opcode_info->src_info[i]), &priv->src_param[i])))
1556 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1557 return;
1563 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
1565 struct wined3d_sm4_data *priv = data;
1566 return *ptr == priv->end;
1569 const struct wined3d_shader_frontend sm4_shader_frontend =
1571 shader_sm4_init,
1572 shader_sm4_free,
1573 shader_sm4_read_header,
1574 shader_sm4_read_instruction,
1575 shader_sm4_is_end,