wined3d: Introduce a wined3d_texture_update_sub_resource() helper.
[wine.git] / dlls / wined3d / shader_sm4.c
blob061ab51d024e18f56c9f332421f7b57f297d6356
1 /*
2 * Copyright 2009 Henri Verbeet for CodeWeavers
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
9 * This library is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
19 #include "config.h"
21 #include "wined3d_private.h"
23 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
24 WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode);
/* Shift/mask pairs and flag bits used to pick fields out of 32-bit shader
 * tokens. Each *_MASK is its field width pre-shifted by the matching *_SHIFT,
 * so a field is extracted as (token & MASK) >> SHIFT. */

/* Bit 31. */
#define WINED3D_SM4_INSTRUCTION_MODIFIER            (0x1u << 31)

#define WINED3D_SM4_MODIFIER_MASK                   0x3fu

#define WINED3D_SM5_MODIFIER_DATA_TYPE_SHIFT        6
#define WINED3D_SM5_MODIFIER_DATA_TYPE_MASK         (0xffffu << WINED3D_SM5_MODIFIER_DATA_TYPE_SHIFT)

#define WINED3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT    6
#define WINED3D_SM5_MODIFIER_RESOURCE_TYPE_MASK     (0xfu << WINED3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT)

/* Three 4-bit fields at bits 9, 13 and 17. */
#define WINED3D_SM4_AOFFIMMI_U_SHIFT                9
#define WINED3D_SM4_AOFFIMMI_U_MASK                 (0xfu << WINED3D_SM4_AOFFIMMI_U_SHIFT)
#define WINED3D_SM4_AOFFIMMI_V_SHIFT                13
#define WINED3D_SM4_AOFFIMMI_V_MASK                 (0xfu << WINED3D_SM4_AOFFIMMI_V_SHIFT)
#define WINED3D_SM4_AOFFIMMI_W_SHIFT                17
#define WINED3D_SM4_AOFFIMMI_W_MASK                 (0xfu << WINED3D_SM4_AOFFIMMI_W_SHIFT)

#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT        24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK         (0x1fu << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

/* Many of the fields below start at bit 11; they overlap on purpose, as each
 * one is only meaningful for the instruction whose reader applies it. */
#define WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT         11
#define WINED3D_SM4_INSTRUCTION_FLAGS_MASK          (0x7u << WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT)

#define WINED3D_SM4_RESOURCE_TYPE_SHIFT             11
#define WINED3D_SM4_RESOURCE_TYPE_MASK              (0xfu << WINED3D_SM4_RESOURCE_TYPE_SHIFT)

#define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT            11
#define WINED3D_SM4_PRIMITIVE_TYPE_MASK             (0x3fu << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)

#define WINED3D_SM4_INDEX_TYPE_SHIFT                11
#define WINED3D_SM4_INDEX_TYPE_MASK                 (0x1u << WINED3D_SM4_INDEX_TYPE_SHIFT)

#define WINED3D_SM4_SAMPLER_MODE_SHIFT              11
#define WINED3D_SM4_SAMPLER_MODE_MASK               (0xfu << WINED3D_SM4_SAMPLER_MODE_SHIFT)

#define WINED3D_SM4_SHADER_DATA_TYPE_SHIFT          11
#define WINED3D_SM4_SHADER_DATA_TYPE_MASK           (0xfu << WINED3D_SM4_SHADER_DATA_TYPE_SHIFT)

#define WINED3D_SM4_INTERPOLATION_MODE_SHIFT        11
#define WINED3D_SM4_INTERPOLATION_MODE_MASK         (0xfu << WINED3D_SM4_INTERPOLATION_MODE_SHIFT)

#define WINED3D_SM4_GLOBAL_FLAGS_SHIFT              11
#define WINED3D_SM4_GLOBAL_FLAGS_MASK               (0xffu << WINED3D_SM4_GLOBAL_FLAGS_SHIFT)

#define WINED3D_SM5_PRECISE_SHIFT                   19
#define WINED3D_SM5_PRECISE_MASK                    (0xfu << WINED3D_SM5_PRECISE_SHIFT)

#define WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT       11
#define WINED3D_SM5_CONTROL_POINT_COUNT_MASK        (0xffu << WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT)

/* Array size lives in the upper 16 bits, table count in the lower 16 bits
 * of the same token (see shader_sm5_read_dcl_interface()). */
#define WINED3D_SM5_FP_ARRAY_SIZE_SHIFT             16
#define WINED3D_SM5_FP_TABLE_COUNT_MASK             0xffffu

#define WINED3D_SM5_UAV_FLAGS_SHIFT                 15
#define WINED3D_SM5_UAV_FLAGS_MASK                  (0x1ffu << WINED3D_SM5_UAV_FLAGS_SHIFT)

#define WINED3D_SM5_SYNC_FLAGS_SHIFT                11
#define WINED3D_SM5_SYNC_FLAGS_MASK                 (0xffu << WINED3D_SM5_SYNC_FLAGS_SHIFT)

#define WINED3D_SM5_TESSELLATOR_SHIFT               11
#define WINED3D_SM5_TESSELLATOR_MASK                (0xfu << WINED3D_SM5_TESSELLATOR_SHIFT)

#define WINED3D_SM4_OPCODE_MASK                     0xff

/* Bit 31. */
#define WINED3D_SM4_REGISTER_MODIFIER               (0x1u << 31)

#define WINED3D_SM4_ADDRESSING_SHIFT1               25
#define WINED3D_SM4_ADDRESSING_MASK1                (0x3u << WINED3D_SM4_ADDRESSING_SHIFT1)

#define WINED3D_SM4_ADDRESSING_SHIFT0               22
#define WINED3D_SM4_ADDRESSING_MASK0                (0x3u << WINED3D_SM4_ADDRESSING_SHIFT0)

#define WINED3D_SM4_REGISTER_ORDER_SHIFT            20
#define WINED3D_SM4_REGISTER_ORDER_MASK             (0x3u << WINED3D_SM4_REGISTER_ORDER_SHIFT)

#define WINED3D_SM4_REGISTER_TYPE_SHIFT             12
#define WINED3D_SM4_REGISTER_TYPE_MASK              (0xffu << WINED3D_SM4_REGISTER_TYPE_SHIFT)

#define WINED3D_SM4_SWIZZLE_TYPE_SHIFT              2
#define WINED3D_SM4_SWIZZLE_TYPE_MASK               (0x3u << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)

#define WINED3D_SM4_DIMENSION_SHIFT                 0
#define WINED3D_SM4_DIMENSION_MASK                  (0x3u << WINED3D_SM4_DIMENSION_SHIFT)

/* The write mask (4 bits) and the swizzle (8 bits) both start at bit 4. */
#define WINED3D_SM4_WRITEMASK_SHIFT                 4
#define WINED3D_SM4_WRITEMASK_MASK                  (0xfu << WINED3D_SM4_WRITEMASK_SHIFT)

#define WINED3D_SM4_SWIZZLE_SHIFT                   4
#define WINED3D_SM4_SWIZZLE_MASK                    (0xffu << WINED3D_SM4_SWIZZLE_SHIFT)

/* Major version is the high nibble of the low byte, minor the low nibble. */
#define WINED3D_SM4_VERSION_MAJOR(version)          (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)          (((version) >> 0) & 0xf)

#define WINED3D_SM4_ADDRESSING_RELATIVE             0x2
#define WINED3D_SM4_ADDRESSING_OFFSET               0x1

#define WINED3D_SM4_INSTRUCTION_FLAG_SATURATE       0x4

/* Bit 18; tested against the opcode token by
 * shader_sm4_read_conditional_op(). */
#define WINED3D_SM4_CONDITIONAL_NZ                  (0x1u << 18)
/* Numeric opcode values; the numbering is sparse, so every value is spelled
 * out explicitly. Enumerators carry either a WINED3D_SM4_OP_ or a
 * WINED3D_SM5_OP_ prefix. */
enum wined3d_sm4_opcode
{
    /* WINED3D_SM4_OP_* */
    WINED3D_SM4_OP_ADD = 0x00,
    WINED3D_SM4_OP_AND = 0x01,
    WINED3D_SM4_OP_BREAK = 0x02,
    WINED3D_SM4_OP_BREAKC = 0x03,
    WINED3D_SM4_OP_CASE = 0x06,
    WINED3D_SM4_OP_CONTINUE = 0x07,
    WINED3D_SM4_OP_CONTINUEC = 0x08,
    WINED3D_SM4_OP_CUT = 0x09,
    WINED3D_SM4_OP_DEFAULT = 0x0a,
    WINED3D_SM4_OP_DERIV_RTX = 0x0b,
    WINED3D_SM4_OP_DERIV_RTY = 0x0c,
    WINED3D_SM4_OP_DISCARD = 0x0d,
    WINED3D_SM4_OP_DIV = 0x0e,
    WINED3D_SM4_OP_DP2 = 0x0f,
    WINED3D_SM4_OP_DP3 = 0x10,
    WINED3D_SM4_OP_DP4 = 0x11,
    WINED3D_SM4_OP_ELSE = 0x12,
    WINED3D_SM4_OP_EMIT = 0x13,
    WINED3D_SM4_OP_ENDIF = 0x15,
    WINED3D_SM4_OP_ENDLOOP = 0x16,
    WINED3D_SM4_OP_ENDSWITCH = 0x17,
    WINED3D_SM4_OP_EQ = 0x18,
    WINED3D_SM4_OP_EXP = 0x19,
    WINED3D_SM4_OP_FRC = 0x1a,
    WINED3D_SM4_OP_FTOI = 0x1b,
    WINED3D_SM4_OP_FTOU = 0x1c,
    WINED3D_SM4_OP_GE = 0x1d,
    WINED3D_SM4_OP_IADD = 0x1e,
    WINED3D_SM4_OP_IF = 0x1f,
    WINED3D_SM4_OP_IEQ = 0x20,
    WINED3D_SM4_OP_IGE = 0x21,
    WINED3D_SM4_OP_ILT = 0x22,
    WINED3D_SM4_OP_IMAD = 0x23,
    WINED3D_SM4_OP_IMAX = 0x24,
    WINED3D_SM4_OP_IMIN = 0x25,
    WINED3D_SM4_OP_IMUL = 0x26,
    WINED3D_SM4_OP_INE = 0x27,
    WINED3D_SM4_OP_INEG = 0x28,
    WINED3D_SM4_OP_ISHL = 0x29,
    WINED3D_SM4_OP_ISHR = 0x2a,
    WINED3D_SM4_OP_ITOF = 0x2b,
    WINED3D_SM4_OP_LABEL = 0x2c,
    WINED3D_SM4_OP_LD = 0x2d,
    WINED3D_SM4_OP_LD2DMS = 0x2e,
    WINED3D_SM4_OP_LOG = 0x2f,
    WINED3D_SM4_OP_LOOP = 0x30,
    WINED3D_SM4_OP_LT = 0x31,
    WINED3D_SM4_OP_MAD = 0x32,
    WINED3D_SM4_OP_MIN = 0x33,
    WINED3D_SM4_OP_MAX = 0x34,
    WINED3D_SM4_OP_SHADER_DATA = 0x35,
    WINED3D_SM4_OP_MOV = 0x36,
    WINED3D_SM4_OP_MOVC = 0x37,
    WINED3D_SM4_OP_MUL = 0x38,
    WINED3D_SM4_OP_NE = 0x39,
    WINED3D_SM4_OP_NOP = 0x3a,
    WINED3D_SM4_OP_NOT = 0x3b,
    WINED3D_SM4_OP_OR = 0x3c,
    WINED3D_SM4_OP_RESINFO = 0x3d,
    WINED3D_SM4_OP_RET = 0x3e,
    WINED3D_SM4_OP_RETC = 0x3f,
    WINED3D_SM4_OP_ROUND_NE = 0x40,
    WINED3D_SM4_OP_ROUND_NI = 0x41,
    WINED3D_SM4_OP_ROUND_PI = 0x42,
    WINED3D_SM4_OP_ROUND_Z = 0x43,
    WINED3D_SM4_OP_RSQ = 0x44,
    WINED3D_SM4_OP_SAMPLE = 0x45,
    WINED3D_SM4_OP_SAMPLE_C = 0x46,
    WINED3D_SM4_OP_SAMPLE_C_LZ = 0x47,
    WINED3D_SM4_OP_SAMPLE_LOD = 0x48,
    WINED3D_SM4_OP_SAMPLE_GRAD = 0x49,
    WINED3D_SM4_OP_SAMPLE_B = 0x4a,
    WINED3D_SM4_OP_SQRT = 0x4b,
    WINED3D_SM4_OP_SWITCH = 0x4c,
    WINED3D_SM4_OP_SINCOS = 0x4d,
    WINED3D_SM4_OP_UDIV = 0x4e,
    WINED3D_SM4_OP_ULT = 0x4f,
    WINED3D_SM4_OP_UGE = 0x50,
    WINED3D_SM4_OP_UMUL = 0x51,
    WINED3D_SM4_OP_UMAX = 0x53,
    WINED3D_SM4_OP_UMIN = 0x54,
    WINED3D_SM4_OP_USHR = 0x55,
    WINED3D_SM4_OP_UTOF = 0x56,
    WINED3D_SM4_OP_XOR = 0x57,
    WINED3D_SM4_OP_DCL_RESOURCE = 0x58,
    WINED3D_SM4_OP_DCL_CONSTANT_BUFFER = 0x59,
    WINED3D_SM4_OP_DCL_SAMPLER = 0x5a,
    WINED3D_SM4_OP_DCL_INDEX_RANGE = 0x5b,
    WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY = 0x5c,
    WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE = 0x5d,
    WINED3D_SM4_OP_DCL_VERTICES_OUT = 0x5e,
    WINED3D_SM4_OP_DCL_INPUT = 0x5f,
    WINED3D_SM4_OP_DCL_INPUT_SGV = 0x60,
    WINED3D_SM4_OP_DCL_INPUT_SIV = 0x61,
    WINED3D_SM4_OP_DCL_INPUT_PS = 0x62,
    WINED3D_SM4_OP_DCL_INPUT_PS_SGV = 0x63,
    WINED3D_SM4_OP_DCL_INPUT_PS_SIV = 0x64,
    WINED3D_SM4_OP_DCL_OUTPUT = 0x65,
    WINED3D_SM4_OP_DCL_OUTPUT_SIV = 0x67,
    WINED3D_SM4_OP_DCL_TEMPS = 0x68,
    WINED3D_SM4_OP_DCL_INDEXABLE_TEMP = 0x69,
    WINED3D_SM4_OP_DCL_GLOBAL_FLAGS = 0x6a,
    WINED3D_SM4_OP_LOD = 0x6c,
    WINED3D_SM4_OP_GATHER4 = 0x6d,
    WINED3D_SM4_OP_SAMPLE_POS = 0x6e,
    WINED3D_SM4_OP_SAMPLE_INFO = 0x6f,

    /* WINED3D_SM5_OP_* */
    WINED3D_SM5_OP_HS_DECLS = 0x71,
    WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE = 0x72,
    WINED3D_SM5_OP_HS_FORK_PHASE = 0x73,
    WINED3D_SM5_OP_HS_JOIN_PHASE = 0x74,
    WINED3D_SM5_OP_EMIT_STREAM = 0x75,
    WINED3D_SM5_OP_CUT_STREAM = 0x76,
    WINED3D_SM5_OP_FCALL = 0x78,
    WINED3D_SM5_OP_BUFINFO = 0x79,
    WINED3D_SM5_OP_DERIV_RTX_COARSE = 0x7a,
    WINED3D_SM5_OP_DERIV_RTX_FINE = 0x7b,
    WINED3D_SM5_OP_DERIV_RTY_COARSE = 0x7c,
    WINED3D_SM5_OP_DERIV_RTY_FINE = 0x7d,
    WINED3D_SM5_OP_GATHER4_C = 0x7e,
    WINED3D_SM5_OP_GATHER4_PO = 0x7f,
    WINED3D_SM5_OP_GATHER4_PO_C = 0x80,
    WINED3D_SM5_OP_RCP = 0x81,
    WINED3D_SM5_OP_F32TOF16 = 0x82,
    WINED3D_SM5_OP_F16TOF32 = 0x83,
    WINED3D_SM5_OP_COUNTBITS = 0x86,
    WINED3D_SM5_OP_FIRSTBIT_HI = 0x87,
    WINED3D_SM5_OP_FIRSTBIT_LO = 0x88,
    WINED3D_SM5_OP_FIRSTBIT_SHI = 0x89,
    WINED3D_SM5_OP_UBFE = 0x8a,
    WINED3D_SM5_OP_IBFE = 0x8b,
    WINED3D_SM5_OP_BFI = 0x8c,
    WINED3D_SM5_OP_BFREV = 0x8d,
    WINED3D_SM5_OP_SWAPC = 0x8e,
    WINED3D_SM5_OP_DCL_STREAM = 0x8f,
    WINED3D_SM5_OP_DCL_FUNCTION_BODY = 0x90,
    WINED3D_SM5_OP_DCL_FUNCTION_TABLE = 0x91,
    WINED3D_SM5_OP_DCL_INTERFACE = 0x92,
    WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT = 0x93,
    WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT = 0x94,
    WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN = 0x95,
    WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING = 0x96,
    WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE = 0x97,
    WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR = 0x98,
    WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT = 0x99,
    WINED3D_SM5_OP_DCL_HS_JOIN_PHASE_INSTANCE_COUNT = 0x9a,
    WINED3D_SM5_OP_DCL_THREAD_GROUP = 0x9b,
    WINED3D_SM5_OP_DCL_UAV_TYPED = 0x9c,
    WINED3D_SM5_OP_DCL_UAV_RAW = 0x9d,
    WINED3D_SM5_OP_DCL_UAV_STRUCTURED = 0x9e,
    WINED3D_SM5_OP_DCL_TGSM_RAW = 0x9f,
    WINED3D_SM5_OP_DCL_TGSM_STRUCTURED = 0xa0,
    WINED3D_SM5_OP_DCL_RESOURCE_RAW = 0xa1,
    WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED = 0xa2,
    WINED3D_SM5_OP_LD_UAV_TYPED = 0xa3,
    WINED3D_SM5_OP_STORE_UAV_TYPED = 0xa4,
    WINED3D_SM5_OP_LD_RAW = 0xa5,
    WINED3D_SM5_OP_STORE_RAW = 0xa6,
    WINED3D_SM5_OP_LD_STRUCTURED = 0xa7,
    WINED3D_SM5_OP_STORE_STRUCTURED = 0xa8,
    WINED3D_SM5_OP_ATOMIC_AND = 0xa9,
    WINED3D_SM5_OP_ATOMIC_OR = 0xaa,
    WINED3D_SM5_OP_ATOMIC_XOR = 0xab,
    WINED3D_SM5_OP_ATOMIC_CMP_STORE = 0xac,
    WINED3D_SM5_OP_ATOMIC_IADD = 0xad,
    WINED3D_SM5_OP_ATOMIC_IMAX = 0xae,
    WINED3D_SM5_OP_ATOMIC_IMIN = 0xaf,
    WINED3D_SM5_OP_ATOMIC_UMAX = 0xb0,
    WINED3D_SM5_OP_ATOMIC_UMIN = 0xb1,
    WINED3D_SM5_OP_IMM_ATOMIC_ALLOC = 0xb2,
    WINED3D_SM5_OP_IMM_ATOMIC_CONSUME = 0xb3,
    WINED3D_SM5_OP_IMM_ATOMIC_IADD = 0xb4,
    WINED3D_SM5_OP_IMM_ATOMIC_AND = 0xb5,
    WINED3D_SM5_OP_IMM_ATOMIC_OR = 0xb6,
    WINED3D_SM5_OP_IMM_ATOMIC_XOR = 0xb7,
    WINED3D_SM5_OP_IMM_ATOMIC_EXCH = 0xb8,
    WINED3D_SM5_OP_IMM_ATOMIC_CMP_EXCH = 0xb9,
    WINED3D_SM5_OP_IMM_ATOMIC_IMAX = 0xba,
    WINED3D_SM5_OP_IMM_ATOMIC_IMIN = 0xbb,
    WINED3D_SM5_OP_IMM_ATOMIC_UMAX = 0xbc,
    WINED3D_SM5_OP_IMM_ATOMIC_UMIN = 0xbd,
    WINED3D_SM5_OP_SYNC = 0xbe,
    WINED3D_SM5_OP_EVAL_SAMPLE_INDEX = 0xcc,
    WINED3D_SM5_OP_DCL_GS_INSTANCES = 0xce,
};
/* Instruction modifier kinds. */
enum wined3d_sm4_instruction_modifier
{
    WINED3D_SM4_MODIFIER_AOFFIMMI = 0x1,
    WINED3D_SM5_MODIFIER_RESOURCE_TYPE = 0x2,
    WINED3D_SM5_MODIFIER_DATA_TYPE = 0x3,
};
/* Register type values; the numbering is sparse, so every value is spelled
 * out explicitly. */
enum wined3d_sm4_register_type
{
    /* WINED3D_SM4_RT_* */
    WINED3D_SM4_RT_TEMP = 0x00,
    WINED3D_SM4_RT_INPUT = 0x01,
    WINED3D_SM4_RT_OUTPUT = 0x02,
    WINED3D_SM4_RT_INDEXABLE_TEMP = 0x03,
    WINED3D_SM4_RT_IMMCONST = 0x04,
    WINED3D_SM4_RT_SAMPLER = 0x06,
    WINED3D_SM4_RT_RESOURCE = 0x07,
    WINED3D_SM4_RT_CONSTBUFFER = 0x08,
    WINED3D_SM4_RT_IMMCONSTBUFFER = 0x09,
    WINED3D_SM4_RT_PRIMID = 0x0b,
    WINED3D_SM4_RT_DEPTHOUT = 0x0c,
    WINED3D_SM4_RT_NULL = 0x0d,
    WINED3D_SM4_RT_RASTERIZER = 0x0e,
    WINED3D_SM4_RT_OMASK = 0x0f,

    /* WINED3D_SM5_RT_* */
    WINED3D_SM5_RT_STREAM = 0x10,
    WINED3D_SM5_RT_FUNCTION_BODY = 0x11,
    WINED3D_SM5_RT_FUNCTION_POINTER = 0x13,
    WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID = 0x16,
    WINED3D_SM5_RT_FORK_INSTANCE_ID = 0x17,
    WINED3D_SM5_RT_JOIN_INSTANCE_ID = 0x18,
    WINED3D_SM5_RT_INPUT_CONTROL_POINT = 0x19,
    WINED3D_SM5_RT_OUTPUT_CONTROL_POINT = 0x1a,
    WINED3D_SM5_RT_PATCH_CONSTANT_DATA = 0x1b,
    WINED3D_SM5_RT_DOMAIN_LOCATION = 0x1c,
    WINED3D_SM5_RT_UAV = 0x1e,
    WINED3D_SM5_RT_SHARED_MEMORY = 0x1f,
    WINED3D_SM5_RT_THREAD_ID = 0x20,
    WINED3D_SM5_RT_THREAD_GROUP_ID = 0x21,
    WINED3D_SM5_RT_LOCAL_THREAD_ID = 0x22,
    WINED3D_SM5_RT_COVERAGE = 0x23,
    WINED3D_SM5_RT_LOCAL_THREAD_INDEX = 0x24,
    WINED3D_SM5_RT_GS_INSTANCE_ID = 0x25,
    WINED3D_SM5_RT_DEPTHOUT_GREATER_EQUAL = 0x26,
    WINED3D_SM5_RT_DEPTHOUT_LESS_EQUAL = 0x27,
};
/* Output primitive type values; used as indices into
 * output_primitive_type_table[]. */
enum wined3d_sm4_output_primitive_type
{
    WINED3D_SM4_OUTPUT_PT_POINTLIST = 0x1,
    WINED3D_SM4_OUTPUT_PT_LINESTRIP = 0x3,
    WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
};
/* Input primitive type values. The PATCH1..PATCH32 values are consecutive,
 * which shader_sm4_read_dcl_input_primitive() relies on to derive the patch
 * vertex count by subtraction. */
enum wined3d_sm4_input_primitive_type
{
    WINED3D_SM4_INPUT_PT_POINT = 0x01,
    WINED3D_SM4_INPUT_PT_LINE = 0x02,
    WINED3D_SM4_INPUT_PT_TRIANGLE = 0x03,
    WINED3D_SM4_INPUT_PT_LINEADJ = 0x06,
    WINED3D_SM4_INPUT_PT_TRIANGLEADJ = 0x07,

    WINED3D_SM5_INPUT_PT_PATCH1 = 0x08,
    WINED3D_SM5_INPUT_PT_PATCH2 = 0x09,
    WINED3D_SM5_INPUT_PT_PATCH3 = 0x0a,
    WINED3D_SM5_INPUT_PT_PATCH4 = 0x0b,
    WINED3D_SM5_INPUT_PT_PATCH5 = 0x0c,
    WINED3D_SM5_INPUT_PT_PATCH6 = 0x0d,
    WINED3D_SM5_INPUT_PT_PATCH7 = 0x0e,
    WINED3D_SM5_INPUT_PT_PATCH8 = 0x0f,
    WINED3D_SM5_INPUT_PT_PATCH9 = 0x10,
    WINED3D_SM5_INPUT_PT_PATCH10 = 0x11,
    WINED3D_SM5_INPUT_PT_PATCH11 = 0x12,
    WINED3D_SM5_INPUT_PT_PATCH12 = 0x13,
    WINED3D_SM5_INPUT_PT_PATCH13 = 0x14,
    WINED3D_SM5_INPUT_PT_PATCH14 = 0x15,
    WINED3D_SM5_INPUT_PT_PATCH15 = 0x16,
    WINED3D_SM5_INPUT_PT_PATCH16 = 0x17,
    WINED3D_SM5_INPUT_PT_PATCH17 = 0x18,
    WINED3D_SM5_INPUT_PT_PATCH18 = 0x19,
    WINED3D_SM5_INPUT_PT_PATCH19 = 0x1a,
    WINED3D_SM5_INPUT_PT_PATCH20 = 0x1b,
    WINED3D_SM5_INPUT_PT_PATCH21 = 0x1c,
    WINED3D_SM5_INPUT_PT_PATCH22 = 0x1d,
    WINED3D_SM5_INPUT_PT_PATCH23 = 0x1e,
    WINED3D_SM5_INPUT_PT_PATCH24 = 0x1f,
    WINED3D_SM5_INPUT_PT_PATCH25 = 0x20,
    WINED3D_SM5_INPUT_PT_PATCH26 = 0x21,
    WINED3D_SM5_INPUT_PT_PATCH27 = 0x22,
    WINED3D_SM5_INPUT_PT_PATCH28 = 0x23,
    WINED3D_SM5_INPUT_PT_PATCH29 = 0x24,
    WINED3D_SM5_INPUT_PT_PATCH30 = 0x25,
    WINED3D_SM5_INPUT_PT_PATCH31 = 0x26,
    WINED3D_SM5_INPUT_PT_PATCH32 = 0x27,
};
/* Swizzle type values. */
enum wined3d_sm4_swizzle_type
{
    WINED3D_SM4_SWIZZLE_NONE = 0x0,
    WINED3D_SM4_SWIZZLE_VEC4 = 0x1,
    WINED3D_SM4_SWIZZLE_SCALAR = 0x2,
};
/* Dimension values. */
enum wined3d_sm4_dimension
{
    WINED3D_SM4_DIMENSION_SCALAR = 0x1,
    WINED3D_SM4_DIMENSION_VEC4 = 0x2,
};
/* Resource type values; used as indices into resource_type_table[]. */
enum wined3d_sm4_resource_type
{
    WINED3D_SM4_RESOURCE_BUFFER = 0x1,
    WINED3D_SM4_RESOURCE_TEXTURE_1D = 0x2,
    WINED3D_SM4_RESOURCE_TEXTURE_2D = 0x3,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMS = 0x4,
    WINED3D_SM4_RESOURCE_TEXTURE_3D = 0x5,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBE = 0x6,
    WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY = 0x7,
    WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY = 0x8,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY = 0x9,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBEARRAY = 0xa,
};
/* Data type values; used as indices into data_type_table[]. */
enum wined3d_sm4_data_type
{
    WINED3D_SM4_DATA_UNORM = 0x1,
    WINED3D_SM4_DATA_SNORM = 0x2,
    WINED3D_SM4_DATA_INT = 0x3,
    WINED3D_SM4_DATA_UINT = 0x4,
    WINED3D_SM4_DATA_FLOAT = 0x5,
};
/* Sampler mode values. */
enum wined3d_sm4_sampler_mode
{
    WINED3D_SM4_SAMPLER_DEFAULT = 0x0,
    WINED3D_SM4_SAMPLER_COMPARISON = 0x1,
};
/* Shader data type values. shader_sm4_read_shader_data() only handles the
 * immediate constant buffer type. */
enum wined3d_sm4_shader_data_type
{
    WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER = 0x3,
    WINED3D_SM4_SHADER_DATA_MESSAGE = 0x4,
};
454 struct wined3d_shader_src_param_entry
456 struct list entry;
457 struct wined3d_shader_src_param param;
460 struct wined3d_sm4_data
462 struct wined3d_shader_version shader_version;
463 const DWORD *start, *end;
465 unsigned int output_map[MAX_REG_OUTPUT];
467 struct wined3d_shader_src_param src_param[5];
468 struct wined3d_shader_dst_param dst_param[2];
469 struct list src_free;
470 struct list src;
471 struct wined3d_shader_immediate_constant_buffer icb;
474 struct wined3d_sm4_opcode_info
476 enum wined3d_sm4_opcode opcode;
477 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
478 const char *dst_info;
479 const char *src_info;
480 void (*read_opcode_func)(struct wined3d_shader_instruction *ins,
481 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
482 struct wined3d_sm4_data *priv);
485 static const enum wined3d_primitive_type output_primitive_type_table[] =
487 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
488 /* WINED3D_SM4_OUTPUT_PT_POINTLIST */ WINED3D_PT_POINTLIST,
489 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
490 /* WINED3D_SM4_OUTPUT_PT_LINESTRIP */ WINED3D_PT_LINESTRIP,
491 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
492 /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ WINED3D_PT_TRIANGLESTRIP,
495 static const enum wined3d_primitive_type input_primitive_type_table[] =
497 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
498 /* WINED3D_SM4_INPUT_PT_POINT */ WINED3D_PT_POINTLIST,
499 /* WINED3D_SM4_INPUT_PT_LINE */ WINED3D_PT_LINELIST,
500 /* WINED3D_SM4_INPUT_PT_TRIANGLE */ WINED3D_PT_TRIANGLELIST,
501 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
502 /* UNKNOWN */ WINED3D_PT_UNDEFINED,
503 /* WINED3D_SM4_INPUT_PT_LINEADJ */ WINED3D_PT_LINELIST_ADJ,
504 /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */ WINED3D_PT_TRIANGLELIST_ADJ,
507 static const enum wined3d_shader_resource_type resource_type_table[] =
509 /* 0 */ WINED3D_SHADER_RESOURCE_NONE,
510 /* WINED3D_SM4_RESOURCE_BUFFER */ WINED3D_SHADER_RESOURCE_BUFFER,
511 /* WINED3D_SM4_RESOURCE_TEXTURE_1D */ WINED3D_SHADER_RESOURCE_TEXTURE_1D,
512 /* WINED3D_SM4_RESOURCE_TEXTURE_2D */ WINED3D_SHADER_RESOURCE_TEXTURE_2D,
513 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMS */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMS,
514 /* WINED3D_SM4_RESOURCE_TEXTURE_3D */ WINED3D_SHADER_RESOURCE_TEXTURE_3D,
515 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBE */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBE,
516 /* WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_1DARRAY,
517 /* WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DARRAY,
518 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY,
519 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBEARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBEARRAY,
522 static const enum wined3d_data_type data_type_table[] =
524 /* 0 */ WINED3D_DATA_FLOAT,
525 /* WINED3D_SM4_DATA_UNORM */ WINED3D_DATA_UNORM,
526 /* WINED3D_SM4_DATA_SNORM */ WINED3D_DATA_SNORM,
527 /* WINED3D_SM4_DATA_INT */ WINED3D_DATA_INT,
528 /* WINED3D_SM4_DATA_UINT */ WINED3D_DATA_UINT,
529 /* WINED3D_SM4_DATA_FLOAT */ WINED3D_DATA_FLOAT,
532 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr, const DWORD *end,
533 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param);
534 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr, const DWORD *end,
535 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param);
537 static void shader_sm4_read_conditional_op(struct wined3d_shader_instruction *ins,
538 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
539 struct wined3d_sm4_data *priv)
541 shader_sm4_read_src_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_UINT, &priv->src_param[0]);
542 ins->flags = (opcode_token & WINED3D_SM4_CONDITIONAL_NZ) ?
543 WINED3D_SHADER_CONDITIONAL_OP_NZ : WINED3D_SHADER_CONDITIONAL_OP_Z;
546 static void shader_sm4_read_shader_data(struct wined3d_shader_instruction *ins,
547 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
548 struct wined3d_sm4_data *priv)
550 enum wined3d_sm4_shader_data_type type;
551 unsigned int icb_size;
553 type = (opcode_token & WINED3D_SM4_SHADER_DATA_TYPE_MASK) >> WINED3D_SM4_SHADER_DATA_TYPE_SHIFT;
554 if (type != WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER)
556 FIXME("Ignoring shader data type %#x.\n", type);
557 ins->handler_idx = WINED3DSIH_NOP;
558 return;
561 ++tokens;
562 icb_size = token_count - 1;
563 if (icb_size % 4 || icb_size > MAX_IMMEDIATE_CONSTANT_BUFFER_SIZE)
565 FIXME("Unexpected immediate constant buffer size %u.\n", icb_size);
566 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
567 return;
570 priv->icb.vec4_count = icb_size / 4;
571 memcpy(priv->icb.data, tokens, sizeof(*tokens) * icb_size);
572 ins->declaration.icb = &priv->icb;
575 static void shader_sm4_read_dcl_resource(struct wined3d_shader_instruction *ins,
576 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
577 struct wined3d_sm4_data *priv)
579 enum wined3d_sm4_resource_type resource_type;
580 enum wined3d_sm4_data_type data_type;
581 enum wined3d_data_type reg_data_type;
582 DWORD components;
584 resource_type = (opcode_token & WINED3D_SM4_RESOURCE_TYPE_MASK) >> WINED3D_SM4_RESOURCE_TYPE_SHIFT;
585 if (!resource_type || (resource_type >= ARRAY_SIZE(resource_type_table)))
587 FIXME("Unhandled resource type %#x.\n", resource_type);
588 ins->declaration.semantic.resource_type = WINED3D_SHADER_RESOURCE_NONE;
590 else
592 ins->declaration.semantic.resource_type = resource_type_table[resource_type];
594 reg_data_type = opcode == WINED3D_SM4_OP_DCL_RESOURCE ? WINED3D_DATA_RESOURCE : WINED3D_DATA_UAV;
595 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], reg_data_type, &ins->declaration.semantic.reg);
597 components = *tokens++;
598 if ((components & 0xfff0) != (components & 0xf) * 0x1110)
599 FIXME("Components (%#x) have different data types.\n", components);
600 data_type = components & 0xf;
602 if (!data_type || (data_type >= ARRAY_SIZE(data_type_table)))
604 FIXME("Unhandled data type %#x.\n", data_type);
605 ins->declaration.semantic.resource_data_type = WINED3D_DATA_FLOAT;
607 else
609 ins->declaration.semantic.resource_data_type = data_type_table[data_type];
612 if (reg_data_type == WINED3D_DATA_UAV)
613 ins->flags = (opcode_token & WINED3D_SM5_UAV_FLAGS_MASK) >> WINED3D_SM5_UAV_FLAGS_SHIFT;
616 static void shader_sm4_read_dcl_constant_buffer(struct wined3d_shader_instruction *ins,
617 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
618 struct wined3d_sm4_data *priv)
620 shader_sm4_read_src_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT, &ins->declaration.src);
621 if (opcode_token & WINED3D_SM4_INDEX_TYPE_MASK)
622 ins->flags |= WINED3DSI_INDEXED_DYNAMIC;
625 static void shader_sm4_read_dcl_sampler(struct wined3d_shader_instruction *ins,
626 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
627 struct wined3d_sm4_data *priv)
629 ins->flags = (opcode_token & WINED3D_SM4_SAMPLER_MODE_MASK) >> WINED3D_SM4_SAMPLER_MODE_SHIFT;
630 if (ins->flags & ~WINED3D_SM4_SAMPLER_COMPARISON)
631 FIXME("Unhandled sampler mode %#x.\n", ins->flags);
632 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_SAMPLER, &ins->declaration.dst);
635 static void shader_sm4_read_dcl_index_range(struct wined3d_shader_instruction *ins,
636 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
637 struct wined3d_sm4_data *priv)
639 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_OPAQUE,
640 &ins->declaration.index_range.first_register);
641 ins->declaration.index_range.last_register = *tokens;
644 static void shader_sm4_read_dcl_output_topology(struct wined3d_shader_instruction *ins,
645 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
646 struct wined3d_sm4_data *priv)
648 enum wined3d_sm4_output_primitive_type primitive_type;
650 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
651 if (primitive_type >= ARRAY_SIZE(output_primitive_type_table))
652 ins->declaration.primitive_type.type = WINED3D_PT_UNDEFINED;
653 else
654 ins->declaration.primitive_type.type = output_primitive_type_table[primitive_type];
656 if (ins->declaration.primitive_type.type == WINED3D_PT_UNDEFINED)
657 FIXME("Unhandled output primitive type %#x.\n", primitive_type);
660 static void shader_sm4_read_dcl_input_primitive(struct wined3d_shader_instruction *ins,
661 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
662 struct wined3d_sm4_data *priv)
664 enum wined3d_sm4_input_primitive_type primitive_type;
666 primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
667 if (WINED3D_SM5_INPUT_PT_PATCH1 <= primitive_type && primitive_type <= WINED3D_SM5_INPUT_PT_PATCH32)
669 ins->declaration.primitive_type.type = WINED3D_PT_PATCH;
670 ins->declaration.primitive_type.patch_vertex_count = primitive_type - WINED3D_SM5_INPUT_PT_PATCH1 + 1;
672 else if (primitive_type >= ARRAY_SIZE(input_primitive_type_table))
674 ins->declaration.primitive_type.type = WINED3D_PT_UNDEFINED;
676 else
678 ins->declaration.primitive_type.type = input_primitive_type_table[primitive_type];
681 if (ins->declaration.primitive_type.type == WINED3D_PT_UNDEFINED)
682 FIXME("Unhandled input primitive type %#x.\n", primitive_type);
685 static void shader_sm4_read_declaration_count(struct wined3d_shader_instruction *ins,
686 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
687 struct wined3d_sm4_data *priv)
689 ins->declaration.count = *tokens;
692 static void shader_sm4_read_declaration_dst(struct wined3d_shader_instruction *ins,
693 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
694 struct wined3d_sm4_data *priv)
696 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT, &ins->declaration.dst);
699 static void shader_sm4_read_declaration_register_semantic(struct wined3d_shader_instruction *ins,
700 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
701 struct wined3d_sm4_data *priv)
703 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT,
704 &ins->declaration.register_semantic.reg);
705 ins->declaration.register_semantic.sysval_semantic = *tokens;
708 static void shader_sm4_read_dcl_input_ps(struct wined3d_shader_instruction *ins,
709 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
710 struct wined3d_sm4_data *priv)
712 ins->flags = (opcode_token & WINED3D_SM4_INTERPOLATION_MODE_MASK) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT;
713 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT, &ins->declaration.dst);
716 static void shader_sm4_read_dcl_input_ps_siv(struct wined3d_shader_instruction *ins,
717 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
718 struct wined3d_sm4_data *priv)
720 ins->flags = (opcode_token & WINED3D_SM4_INTERPOLATION_MODE_MASK) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT;
721 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT,
722 &ins->declaration.register_semantic.reg);
723 ins->declaration.register_semantic.sysval_semantic = *tokens;
726 static void shader_sm4_read_dcl_indexable_temp(struct wined3d_shader_instruction *ins,
727 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
728 struct wined3d_sm4_data *priv)
730 ins->declaration.indexable_temp.register_idx = *tokens++;
731 ins->declaration.indexable_temp.register_size = *tokens++;
732 ins->declaration.indexable_temp.component_count = *tokens;
735 static void shader_sm4_read_dcl_global_flags(struct wined3d_shader_instruction *ins,
736 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
737 struct wined3d_sm4_data *priv)
739 ins->flags = (opcode_token & WINED3D_SM4_GLOBAL_FLAGS_MASK) >> WINED3D_SM4_GLOBAL_FLAGS_SHIFT;
742 static void shader_sm5_read_fcall(struct wined3d_shader_instruction *ins,
743 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
744 struct wined3d_sm4_data *priv)
746 priv->src_param[0].reg.u.fp_body_idx = *tokens++;
747 shader_sm4_read_src_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_OPAQUE, &priv->src_param[0]);
750 static void shader_sm5_read_dcl_function_body(struct wined3d_shader_instruction *ins,
751 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
752 struct wined3d_sm4_data *priv)
754 ins->declaration.index = *tokens;
757 static void shader_sm5_read_dcl_function_table(struct wined3d_shader_instruction *ins,
758 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
759 struct wined3d_sm4_data *priv)
761 ins->declaration.index = *tokens++;
762 FIXME("Ignoring set of function bodies (count %u).\n", *tokens);
765 static void shader_sm5_read_dcl_interface(struct wined3d_shader_instruction *ins,
766 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
767 struct wined3d_sm4_data *priv)
769 ins->declaration.fp.index = *tokens++;
770 ins->declaration.fp.body_count = *tokens++;
771 ins->declaration.fp.array_size = *tokens >> WINED3D_SM5_FP_ARRAY_SIZE_SHIFT;
772 ins->declaration.fp.table_count = *tokens++ & WINED3D_SM5_FP_TABLE_COUNT_MASK;
773 FIXME("Ignoring set of function tables (count %u).\n", ins->declaration.fp.table_count);
776 static void shader_sm5_read_control_point_count(struct wined3d_shader_instruction *ins,
777 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
778 struct wined3d_sm4_data *priv)
780 ins->declaration.count = (opcode_token & WINED3D_SM5_CONTROL_POINT_COUNT_MASK)
781 >> WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT;
784 static void shader_sm5_read_dcl_tessellator_domain(struct wined3d_shader_instruction *ins,
785 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
786 struct wined3d_sm4_data *priv)
788 ins->declaration.tessellator_domain = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
789 >> WINED3D_SM5_TESSELLATOR_SHIFT;
792 static void shader_sm5_read_dcl_tessellator_partitioning(struct wined3d_shader_instruction *ins,
793 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
794 struct wined3d_sm4_data *priv)
796 ins->declaration.tessellator_partitioning = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
797 >> WINED3D_SM5_TESSELLATOR_SHIFT;
800 static void shader_sm5_read_dcl_tessellator_output_primitive(struct wined3d_shader_instruction *ins,
801 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
802 struct wined3d_sm4_data *priv)
804 ins->declaration.tessellator_output_primitive = (opcode_token & WINED3D_SM5_TESSELLATOR_MASK)
805 >> WINED3D_SM5_TESSELLATOR_SHIFT;
808 static void shader_sm5_read_dcl_hs_max_tessfactor(struct wined3d_shader_instruction *ins,
809 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
810 struct wined3d_sm4_data *priv)
812 ins->declaration.max_tessellation_factor = *(float *)tokens;
815 static void shader_sm5_read_dcl_thread_group(struct wined3d_shader_instruction *ins,
816 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
817 struct wined3d_sm4_data *priv)
819 ins->declaration.thread_group_size.x = *tokens++;
820 ins->declaration.thread_group_size.y = *tokens++;
821 ins->declaration.thread_group_size.z = *tokens++;
824 static void shader_sm5_read_dcl_uav_raw(struct wined3d_shader_instruction *ins,
825 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
826 struct wined3d_sm4_data *priv)
828 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_UAV, &ins->declaration.dst);
829 ins->flags = (opcode_token & WINED3D_SM5_UAV_FLAGS_MASK) >> WINED3D_SM5_UAV_FLAGS_SHIFT;
832 static void shader_sm5_read_dcl_uav_structured(struct wined3d_shader_instruction *ins,
833 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
834 struct wined3d_sm4_data *priv)
836 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_UAV,
837 &ins->declaration.structured_resource.reg);
838 ins->flags = (opcode_token & WINED3D_SM5_UAV_FLAGS_MASK) >> WINED3D_SM5_UAV_FLAGS_SHIFT;
839 ins->declaration.structured_resource.byte_stride = *tokens;
840 if (ins->declaration.structured_resource.byte_stride % 4)
841 FIXME("Byte stride %u is not multiple of 4.\n", ins->declaration.structured_resource.byte_stride);
844 static void shader_sm5_read_dcl_tgsm_raw(struct wined3d_shader_instruction *ins,
845 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
846 struct wined3d_sm4_data *priv)
848 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT, &ins->declaration.tgsm_raw.reg);
849 ins->declaration.tgsm_raw.byte_count = *tokens;
850 if (ins->declaration.tgsm_raw.byte_count % 4)
851 FIXME("Byte count %u is not multiple of 4.\n", ins->declaration.tgsm_raw.byte_count);
854 static void shader_sm5_read_dcl_tgsm_structured(struct wined3d_shader_instruction *ins,
855 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
856 struct wined3d_sm4_data *priv)
858 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_FLOAT,
859 &ins->declaration.tgsm_structured.reg);
860 ins->declaration.tgsm_structured.byte_stride = *tokens++;
861 ins->declaration.tgsm_structured.structure_count = *tokens;
862 if (ins->declaration.tgsm_structured.byte_stride % 4)
863 FIXME("Byte stride %u is not multiple of 4.\n", ins->declaration.tgsm_structured.byte_stride);
866 static void shader_sm5_read_dcl_resource_structured(struct wined3d_shader_instruction *ins,
867 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
868 struct wined3d_sm4_data *priv)
870 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_RESOURCE,
871 &ins->declaration.structured_resource.reg);
872 ins->declaration.structured_resource.byte_stride = *tokens;
873 if (ins->declaration.structured_resource.byte_stride % 4)
874 FIXME("Byte stride %u is not multiple of 4.\n", ins->declaration.structured_resource.byte_stride);
877 static void shader_sm5_read_dcl_resource_raw(struct wined3d_shader_instruction *ins,
878 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
879 struct wined3d_sm4_data *priv)
881 shader_sm4_read_dst_param(priv, &tokens, &tokens[token_count], WINED3D_DATA_RESOURCE, &ins->declaration.dst);
884 static void shader_sm5_read_sync(struct wined3d_shader_instruction *ins,
885 DWORD opcode, DWORD opcode_token, const DWORD *tokens, unsigned int token_count,
886 struct wined3d_sm4_data *priv)
888 ins->flags = (opcode_token & WINED3D_SM5_SYNC_FLAGS_MASK) >> WINED3D_SM5_SYNC_FLAGS_SHIFT;
892 * f -> WINED3D_DATA_FLOAT
893 * i -> WINED3D_DATA_INT
894 * u -> WINED3D_DATA_UINT
895 * O -> WINED3D_DATA_OPAQUE
896 * R -> WINED3D_DATA_RESOURCE
897 * S -> WINED3D_DATA_SAMPLER
898 * U -> WINED3D_DATA_UAV
900 static const struct wined3d_sm4_opcode_info opcode_table[] =
902 {WINED3D_SM4_OP_ADD, WINED3DSIH_ADD, "f", "ff"},
903 {WINED3D_SM4_OP_AND, WINED3DSIH_AND, "u", "uu"},
904 {WINED3D_SM4_OP_BREAK, WINED3DSIH_BREAK, "", ""},
905 {WINED3D_SM4_OP_BREAKC, WINED3DSIH_BREAKP, "", "u",
906 shader_sm4_read_conditional_op},
907 {WINED3D_SM4_OP_CASE, WINED3DSIH_CASE, "", "u"},
908 {WINED3D_SM4_OP_CONTINUE, WINED3DSIH_CONTINUE, "", ""},
909 {WINED3D_SM4_OP_CONTINUEC, WINED3DSIH_CONTINUEP, "", "u",
910 shader_sm4_read_conditional_op},
911 {WINED3D_SM4_OP_CUT, WINED3DSIH_CUT, "", ""},
912 {WINED3D_SM4_OP_DEFAULT, WINED3DSIH_DEFAULT, "", ""},
913 {WINED3D_SM4_OP_DERIV_RTX, WINED3DSIH_DSX, "f", "f"},
914 {WINED3D_SM4_OP_DERIV_RTY, WINED3DSIH_DSY, "f", "f"},
915 {WINED3D_SM4_OP_DISCARD, WINED3DSIH_TEXKILL, "", "u",
916 shader_sm4_read_conditional_op},
917 {WINED3D_SM4_OP_DIV, WINED3DSIH_DIV, "f", "ff"},
918 {WINED3D_SM4_OP_DP2, WINED3DSIH_DP2, "f", "ff"},
919 {WINED3D_SM4_OP_DP3, WINED3DSIH_DP3, "f", "ff"},
920 {WINED3D_SM4_OP_DP4, WINED3DSIH_DP4, "f", "ff"},
921 {WINED3D_SM4_OP_ELSE, WINED3DSIH_ELSE, "", ""},
922 {WINED3D_SM4_OP_EMIT, WINED3DSIH_EMIT, "", ""},
923 {WINED3D_SM4_OP_ENDIF, WINED3DSIH_ENDIF, "", ""},
924 {WINED3D_SM4_OP_ENDLOOP, WINED3DSIH_ENDLOOP, "", ""},
925 {WINED3D_SM4_OP_ENDSWITCH, WINED3DSIH_ENDSWITCH, "", ""},
926 {WINED3D_SM4_OP_EQ, WINED3DSIH_EQ, "u", "ff"},
927 {WINED3D_SM4_OP_EXP, WINED3DSIH_EXP, "f", "f"},
928 {WINED3D_SM4_OP_FRC, WINED3DSIH_FRC, "f", "f"},
929 {WINED3D_SM4_OP_FTOI, WINED3DSIH_FTOI, "i", "f"},
930 {WINED3D_SM4_OP_FTOU, WINED3DSIH_FTOU, "u", "f"},
931 {WINED3D_SM4_OP_GE, WINED3DSIH_GE, "u", "ff"},
932 {WINED3D_SM4_OP_IADD, WINED3DSIH_IADD, "i", "ii"},
933 {WINED3D_SM4_OP_IF, WINED3DSIH_IF, "", "u",
934 shader_sm4_read_conditional_op},
935 {WINED3D_SM4_OP_IEQ, WINED3DSIH_IEQ, "u", "ii"},
936 {WINED3D_SM4_OP_IGE, WINED3DSIH_IGE, "u", "ii"},
937 {WINED3D_SM4_OP_ILT, WINED3DSIH_ILT, "u", "ii"},
938 {WINED3D_SM4_OP_IMAD, WINED3DSIH_IMAD, "i", "iii"},
939 {WINED3D_SM4_OP_IMAX, WINED3DSIH_IMAX, "i", "ii"},
940 {WINED3D_SM4_OP_IMIN, WINED3DSIH_IMIN, "i", "ii"},
941 {WINED3D_SM4_OP_IMUL, WINED3DSIH_IMUL, "ii", "ii"},
942 {WINED3D_SM4_OP_INE, WINED3DSIH_INE, "u", "ii"},
943 {WINED3D_SM4_OP_INEG, WINED3DSIH_INEG, "i", "i"},
944 {WINED3D_SM4_OP_ISHL, WINED3DSIH_ISHL, "i", "ii"},
945 {WINED3D_SM4_OP_ISHR, WINED3DSIH_ISHR, "i", "ii"},
946 {WINED3D_SM4_OP_ITOF, WINED3DSIH_ITOF, "f", "i"},
947 {WINED3D_SM4_OP_LABEL, WINED3DSIH_LABEL, "", "O"},
948 {WINED3D_SM4_OP_LD, WINED3DSIH_LD, "u", "iR"},
949 {WINED3D_SM4_OP_LD2DMS, WINED3DSIH_LD2DMS, "u", "iRi"},
950 {WINED3D_SM4_OP_LOG, WINED3DSIH_LOG, "f", "f"},
951 {WINED3D_SM4_OP_LOOP, WINED3DSIH_LOOP, "", ""},
952 {WINED3D_SM4_OP_LT, WINED3DSIH_LT, "u", "ff"},
953 {WINED3D_SM4_OP_MAD, WINED3DSIH_MAD, "f", "fff"},
954 {WINED3D_SM4_OP_MIN, WINED3DSIH_MIN, "f", "ff"},
955 {WINED3D_SM4_OP_MAX, WINED3DSIH_MAX, "f", "ff"},
956 {WINED3D_SM4_OP_SHADER_DATA, WINED3DSIH_DCL_IMMEDIATE_CONSTANT_BUFFER, "", "",
957 shader_sm4_read_shader_data},
958 {WINED3D_SM4_OP_MOV, WINED3DSIH_MOV, "f", "f"},
959 {WINED3D_SM4_OP_MOVC, WINED3DSIH_MOVC, "f", "uff"},
960 {WINED3D_SM4_OP_MUL, WINED3DSIH_MUL, "f", "ff"},
961 {WINED3D_SM4_OP_NE, WINED3DSIH_NE, "u", "ff"},
962 {WINED3D_SM4_OP_NOP, WINED3DSIH_NOP, "", ""},
963 {WINED3D_SM4_OP_NOT, WINED3DSIH_NOT, "u", "u"},
964 {WINED3D_SM4_OP_OR, WINED3DSIH_OR, "u", "uu"},
965 {WINED3D_SM4_OP_RESINFO, WINED3DSIH_RESINFO, "f", "iR"},
966 {WINED3D_SM4_OP_RET, WINED3DSIH_RET, "", ""},
967 {WINED3D_SM4_OP_RETC, WINED3DSIH_RETP, "", "u",
968 shader_sm4_read_conditional_op},
969 {WINED3D_SM4_OP_ROUND_NE, WINED3DSIH_ROUND_NE, "f", "f"},
970 {WINED3D_SM4_OP_ROUND_NI, WINED3DSIH_ROUND_NI, "f", "f"},
971 {WINED3D_SM4_OP_ROUND_PI, WINED3DSIH_ROUND_PI, "f", "f"},
972 {WINED3D_SM4_OP_ROUND_Z, WINED3DSIH_ROUND_Z, "f", "f"},
973 {WINED3D_SM4_OP_RSQ, WINED3DSIH_RSQ, "f", "f"},
974 {WINED3D_SM4_OP_SAMPLE, WINED3DSIH_SAMPLE, "u", "fRS"},
975 {WINED3D_SM4_OP_SAMPLE_C, WINED3DSIH_SAMPLE_C, "f", "fRSf"},
976 {WINED3D_SM4_OP_SAMPLE_C_LZ, WINED3DSIH_SAMPLE_C_LZ, "f", "fRSf"},
977 {WINED3D_SM4_OP_SAMPLE_LOD, WINED3DSIH_SAMPLE_LOD, "u", "fRSf"},
978 {WINED3D_SM4_OP_SAMPLE_GRAD, WINED3DSIH_SAMPLE_GRAD, "u", "fRSff"},
979 {WINED3D_SM4_OP_SAMPLE_B, WINED3DSIH_SAMPLE_B, "u", "fRSf"},
980 {WINED3D_SM4_OP_SQRT, WINED3DSIH_SQRT, "f", "f"},
981 {WINED3D_SM4_OP_SWITCH, WINED3DSIH_SWITCH, "", "u"},
982 {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS, "ff", "f"},
983 {WINED3D_SM4_OP_UDIV, WINED3DSIH_UDIV, "uu", "uu"},
984 {WINED3D_SM4_OP_ULT, WINED3DSIH_ULT, "u", "uu"},
985 {WINED3D_SM4_OP_UGE, WINED3DSIH_UGE, "u", "uu"},
986 {WINED3D_SM4_OP_UMUL, WINED3DSIH_UMUL, "uu", "uu"},
987 {WINED3D_SM4_OP_UMAX, WINED3DSIH_UMAX, "u", "uu"},
988 {WINED3D_SM4_OP_UMIN, WINED3DSIH_UMIN, "u", "uu"},
989 {WINED3D_SM4_OP_USHR, WINED3DSIH_USHR, "u", "uu"},
990 {WINED3D_SM4_OP_UTOF, WINED3DSIH_UTOF, "f", "u"},
991 {WINED3D_SM4_OP_XOR, WINED3DSIH_XOR, "u", "uu"},
992 {WINED3D_SM4_OP_DCL_RESOURCE, WINED3DSIH_DCL, "R", "",
993 shader_sm4_read_dcl_resource},
994 {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER, WINED3DSIH_DCL_CONSTANT_BUFFER, "", "",
995 shader_sm4_read_dcl_constant_buffer},
996 {WINED3D_SM4_OP_DCL_SAMPLER, WINED3DSIH_DCL_SAMPLER, "", "",
997 shader_sm4_read_dcl_sampler},
998 {WINED3D_SM4_OP_DCL_INDEX_RANGE, WINED3DSIH_DCL_INDEX_RANGE, "", "",
999 shader_sm4_read_dcl_index_range},
1000 {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY, WINED3DSIH_DCL_OUTPUT_TOPOLOGY, "", "",
1001 shader_sm4_read_dcl_output_topology},
1002 {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE, WINED3DSIH_DCL_INPUT_PRIMITIVE, "", "",
1003 shader_sm4_read_dcl_input_primitive},
1004 {WINED3D_SM4_OP_DCL_VERTICES_OUT, WINED3DSIH_DCL_VERTICES_OUT, "", "",
1005 shader_sm4_read_declaration_count},
1006 {WINED3D_SM4_OP_DCL_INPUT, WINED3DSIH_DCL_INPUT, "", "",
1007 shader_sm4_read_declaration_dst},
1008 {WINED3D_SM4_OP_DCL_INPUT_SGV, WINED3DSIH_DCL_INPUT_SGV, "", "",
1009 shader_sm4_read_declaration_register_semantic},
1010 {WINED3D_SM4_OP_DCL_INPUT_SIV, WINED3DSIH_DCL_INPUT_SIV, "", "",
1011 shader_sm4_read_declaration_register_semantic},
1012 {WINED3D_SM4_OP_DCL_INPUT_PS, WINED3DSIH_DCL_INPUT_PS, "", "",
1013 shader_sm4_read_dcl_input_ps},
1014 {WINED3D_SM4_OP_DCL_INPUT_PS_SGV, WINED3DSIH_DCL_INPUT_PS_SGV, "", "",
1015 shader_sm4_read_declaration_register_semantic},
1016 {WINED3D_SM4_OP_DCL_INPUT_PS_SIV, WINED3DSIH_DCL_INPUT_PS_SIV, "", "",
1017 shader_sm4_read_dcl_input_ps_siv},
1018 {WINED3D_SM4_OP_DCL_OUTPUT, WINED3DSIH_DCL_OUTPUT, "", "",
1019 shader_sm4_read_declaration_dst},
1020 {WINED3D_SM4_OP_DCL_OUTPUT_SIV, WINED3DSIH_DCL_OUTPUT_SIV, "", "",
1021 shader_sm4_read_declaration_register_semantic},
1022 {WINED3D_SM4_OP_DCL_TEMPS, WINED3DSIH_DCL_TEMPS, "", "",
1023 shader_sm4_read_declaration_count},
1024 {WINED3D_SM4_OP_DCL_INDEXABLE_TEMP, WINED3DSIH_DCL_INDEXABLE_TEMP, "", "",
1025 shader_sm4_read_dcl_indexable_temp},
1026 {WINED3D_SM4_OP_DCL_GLOBAL_FLAGS, WINED3DSIH_DCL_GLOBAL_FLAGS, "", "",
1027 shader_sm4_read_dcl_global_flags},
1028 {WINED3D_SM4_OP_LOD, WINED3DSIH_LOD, "f", "fRS"},
1029 {WINED3D_SM4_OP_GATHER4, WINED3DSIH_GATHER4, "u", "fRS"},
1030 {WINED3D_SM4_OP_SAMPLE_POS, WINED3DSIH_SAMPLE_POS, "f", "Ru"},
1031 {WINED3D_SM4_OP_SAMPLE_INFO, WINED3DSIH_SAMPLE_INFO, "f", "R"},
1032 {WINED3D_SM5_OP_HS_DECLS, WINED3DSIH_HS_DECLS, "", ""},
1033 {WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE, WINED3DSIH_HS_CONTROL_POINT_PHASE, "", ""},
1034 {WINED3D_SM5_OP_HS_FORK_PHASE, WINED3DSIH_HS_FORK_PHASE, "", ""},
1035 {WINED3D_SM5_OP_HS_JOIN_PHASE, WINED3DSIH_HS_JOIN_PHASE, "", ""},
1036 {WINED3D_SM5_OP_EMIT_STREAM, WINED3DSIH_EMIT_STREAM, "", "f"},
1037 {WINED3D_SM5_OP_CUT_STREAM, WINED3DSIH_CUT_STREAM, "", "f"},
1038 {WINED3D_SM5_OP_FCALL, WINED3DSIH_FCALL, "", "O",
1039 shader_sm5_read_fcall},
1040 {WINED3D_SM5_OP_BUFINFO, WINED3DSIH_BUFINFO, "i", "U"},
1041 {WINED3D_SM5_OP_DERIV_RTX_COARSE, WINED3DSIH_DSX_COARSE, "f", "f"},
1042 {WINED3D_SM5_OP_DERIV_RTX_FINE, WINED3DSIH_DSX_FINE, "f", "f"},
1043 {WINED3D_SM5_OP_DERIV_RTY_COARSE, WINED3DSIH_DSY_COARSE, "f", "f"},
1044 {WINED3D_SM5_OP_DERIV_RTY_FINE, WINED3DSIH_DSY_FINE, "f", "f"},
1045 {WINED3D_SM5_OP_GATHER4_C, WINED3DSIH_GATHER4_C, "f", "fRSf"},
1046 {WINED3D_SM5_OP_GATHER4_PO, WINED3DSIH_GATHER4_PO, "f", "fiRS"},
1047 {WINED3D_SM5_OP_GATHER4_PO_C, WINED3DSIH_GATHER4_PO_C, "f", "fiRSf"},
1048 {WINED3D_SM5_OP_RCP, WINED3DSIH_RCP, "f", "f"},
1049 {WINED3D_SM5_OP_F32TOF16, WINED3DSIH_F32TOF16, "u", "f"},
1050 {WINED3D_SM5_OP_F16TOF32, WINED3DSIH_F16TOF32, "f", "u"},
1051 {WINED3D_SM5_OP_COUNTBITS, WINED3DSIH_COUNTBITS, "u", "u"},
1052 {WINED3D_SM5_OP_FIRSTBIT_HI, WINED3DSIH_FIRSTBIT_HI, "u", "u"},
1053 {WINED3D_SM5_OP_FIRSTBIT_LO, WINED3DSIH_FIRSTBIT_LO, "u", "u"},
1054 {WINED3D_SM5_OP_FIRSTBIT_SHI, WINED3DSIH_FIRSTBIT_SHI, "u", "i"},
1055 {WINED3D_SM5_OP_UBFE, WINED3DSIH_UBFE, "u", "iiu"},
1056 {WINED3D_SM5_OP_IBFE, WINED3DSIH_IBFE, "i", "iii"},
1057 {WINED3D_SM5_OP_BFI, WINED3DSIH_BFI, "u", "iiuu"},
1058 {WINED3D_SM5_OP_BFREV, WINED3DSIH_BFREV, "u", "u"},
1059 {WINED3D_SM5_OP_SWAPC, WINED3DSIH_SWAPC, "ff", "uff"},
1060 {WINED3D_SM5_OP_DCL_STREAM, WINED3DSIH_DCL_STREAM, "", "O"},
1061 {WINED3D_SM5_OP_DCL_FUNCTION_BODY, WINED3DSIH_DCL_FUNCTION_BODY, "", "",
1062 shader_sm5_read_dcl_function_body},
1063 {WINED3D_SM5_OP_DCL_FUNCTION_TABLE, WINED3DSIH_DCL_FUNCTION_TABLE, "", "",
1064 shader_sm5_read_dcl_function_table},
1065 {WINED3D_SM5_OP_DCL_INTERFACE, WINED3DSIH_DCL_INTERFACE, "", "",
1066 shader_sm5_read_dcl_interface},
1067 {WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT, WINED3DSIH_DCL_INPUT_CONTROL_POINT_COUNT, "", "",
1068 shader_sm5_read_control_point_count},
1069 {WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT, WINED3DSIH_DCL_OUTPUT_CONTROL_POINT_COUNT, "", "",
1070 shader_sm5_read_control_point_count},
1071 {WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN, WINED3DSIH_DCL_TESSELLATOR_DOMAIN, "", "",
1072 shader_sm5_read_dcl_tessellator_domain},
1073 {WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING, WINED3DSIH_DCL_TESSELLATOR_PARTITIONING, "", "",
1074 shader_sm5_read_dcl_tessellator_partitioning},
1075 {WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, WINED3DSIH_DCL_TESSELLATOR_OUTPUT_PRIMITIVE, "", "",
1076 shader_sm5_read_dcl_tessellator_output_primitive},
1077 {WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR, WINED3DSIH_DCL_HS_MAX_TESSFACTOR, "", "",
1078 shader_sm5_read_dcl_hs_max_tessfactor},
1079 {WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT, WINED3DSIH_DCL_HS_FORK_PHASE_INSTANCE_COUNT, "", "",
1080 shader_sm4_read_declaration_count},
1081 {WINED3D_SM5_OP_DCL_HS_JOIN_PHASE_INSTANCE_COUNT, WINED3DSIH_DCL_HS_JOIN_PHASE_INSTANCE_COUNT, "", "",
1082 shader_sm4_read_declaration_count},
1083 {WINED3D_SM5_OP_DCL_THREAD_GROUP, WINED3DSIH_DCL_THREAD_GROUP, "", "",
1084 shader_sm5_read_dcl_thread_group},
1085 {WINED3D_SM5_OP_DCL_UAV_TYPED, WINED3DSIH_DCL_UAV_TYPED, "", "",
1086 shader_sm4_read_dcl_resource},
1087 {WINED3D_SM5_OP_DCL_UAV_RAW, WINED3DSIH_DCL_UAV_RAW, "", "",
1088 shader_sm5_read_dcl_uav_raw},
1089 {WINED3D_SM5_OP_DCL_UAV_STRUCTURED, WINED3DSIH_DCL_UAV_STRUCTURED, "", "",
1090 shader_sm5_read_dcl_uav_structured},
1091 {WINED3D_SM5_OP_DCL_TGSM_RAW, WINED3DSIH_DCL_TGSM_RAW, "", "",
1092 shader_sm5_read_dcl_tgsm_raw},
1093 {WINED3D_SM5_OP_DCL_TGSM_STRUCTURED, WINED3DSIH_DCL_TGSM_STRUCTURED, "", "",
1094 shader_sm5_read_dcl_tgsm_structured},
1095 {WINED3D_SM5_OP_DCL_RESOURCE_RAW, WINED3DSIH_DCL_RESOURCE_RAW, "", "",
1096 shader_sm5_read_dcl_resource_raw},
1097 {WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED, WINED3DSIH_DCL_RESOURCE_STRUCTURED, "", "",
1098 shader_sm5_read_dcl_resource_structured},
1099 {WINED3D_SM5_OP_LD_UAV_TYPED, WINED3DSIH_LD_UAV_TYPED, "u", "iU"},
1100 {WINED3D_SM5_OP_STORE_UAV_TYPED, WINED3DSIH_STORE_UAV_TYPED, "U", "iu"},
1101 {WINED3D_SM5_OP_LD_RAW, WINED3DSIH_LD_RAW, "u", "iU"},
1102 {WINED3D_SM5_OP_STORE_RAW, WINED3DSIH_STORE_RAW, "U", "iu"},
1103 {WINED3D_SM5_OP_LD_STRUCTURED, WINED3DSIH_LD_STRUCTURED, "u", "iiR"},
1104 {WINED3D_SM5_OP_STORE_STRUCTURED, WINED3DSIH_STORE_STRUCTURED, "U", "iiu"},
1105 {WINED3D_SM5_OP_ATOMIC_AND, WINED3DSIH_ATOMIC_AND, "U", "iu"},
1106 {WINED3D_SM5_OP_ATOMIC_OR, WINED3DSIH_ATOMIC_OR, "U", "iu"},
1107 {WINED3D_SM5_OP_ATOMIC_XOR, WINED3DSIH_ATOMIC_XOR, "U", "iu"},
1108 {WINED3D_SM5_OP_ATOMIC_CMP_STORE, WINED3DSIH_ATOMIC_CMP_STORE, "U", "iuu"},
1109 {WINED3D_SM5_OP_ATOMIC_IADD, WINED3DSIH_ATOMIC_IADD, "U", "ii"},
1110 {WINED3D_SM5_OP_ATOMIC_IMAX, WINED3DSIH_ATOMIC_IMAX, "U", "ii"},
1111 {WINED3D_SM5_OP_ATOMIC_IMIN, WINED3DSIH_ATOMIC_IMIN, "U", "ii"},
1112 {WINED3D_SM5_OP_ATOMIC_UMAX, WINED3DSIH_ATOMIC_UMAX, "U", "iu"},
1113 {WINED3D_SM5_OP_ATOMIC_UMIN, WINED3DSIH_ATOMIC_UMIN, "U", "iu"},
1114 {WINED3D_SM5_OP_IMM_ATOMIC_ALLOC, WINED3DSIH_IMM_ATOMIC_ALLOC, "u", "U"},
1115 {WINED3D_SM5_OP_IMM_ATOMIC_CONSUME, WINED3DSIH_IMM_ATOMIC_CONSUME, "u", "U"},
1116 {WINED3D_SM5_OP_IMM_ATOMIC_IADD, WINED3DSIH_IMM_ATOMIC_IADD, "uU", "ii"},
1117 {WINED3D_SM5_OP_IMM_ATOMIC_AND, WINED3DSIH_IMM_ATOMIC_AND, "uU", "iu"},
1118 {WINED3D_SM5_OP_IMM_ATOMIC_OR, WINED3DSIH_IMM_ATOMIC_OR, "uU", "iu"},
1119 {WINED3D_SM5_OP_IMM_ATOMIC_XOR, WINED3DSIH_IMM_ATOMIC_XOR, "uU", "iu"},
1120 {WINED3D_SM5_OP_IMM_ATOMIC_EXCH, WINED3DSIH_IMM_ATOMIC_EXCH, "uU", "iu"},
1121 {WINED3D_SM5_OP_IMM_ATOMIC_CMP_EXCH, WINED3DSIH_IMM_ATOMIC_CMP_EXCH, "uU", "iuu"},
1122 {WINED3D_SM5_OP_IMM_ATOMIC_IMAX, WINED3DSIH_IMM_ATOMIC_IMAX, "iU", "ii"},
1123 {WINED3D_SM5_OP_IMM_ATOMIC_IMIN, WINED3DSIH_IMM_ATOMIC_IMIN, "iU", "ii"},
1124 {WINED3D_SM5_OP_IMM_ATOMIC_UMAX, WINED3DSIH_IMM_ATOMIC_UMAX, "uU", "iu"},
1125 {WINED3D_SM5_OP_IMM_ATOMIC_UMIN, WINED3DSIH_IMM_ATOMIC_UMIN, "uU", "iu"},
1126 {WINED3D_SM5_OP_SYNC, WINED3DSIH_SYNC, "", "",
1127 shader_sm5_read_sync},
1128 {WINED3D_SM5_OP_EVAL_SAMPLE_INDEX, WINED3DSIH_EVAL_SAMPLE_INDEX, "f", "fi"},
1129 {WINED3D_SM5_OP_DCL_GS_INSTANCES, WINED3DSIH_DCL_GS_INSTANCES, "", "",
1130 shader_sm4_read_declaration_count},
1133 static const enum wined3d_shader_register_type register_type_table[] =
1135 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP,
1136 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT,
1137 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT,
1138 /* WINED3D_SM4_RT_INDEXABLE_TEMP */ WINED3DSPR_IDXTEMP,
1139 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST,
1140 /* UNKNOWN */ ~0u,
1141 /* WINED3D_SM4_RT_SAMPLER */ WINED3DSPR_SAMPLER,
1142 /* WINED3D_SM4_RT_RESOURCE */ WINED3DSPR_RESOURCE,
1143 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER,
1144 /* WINED3D_SM4_RT_IMMCONSTBUFFER */ WINED3DSPR_IMMCONSTBUFFER,
1145 /* UNKNOWN */ ~0u,
1146 /* WINED3D_SM4_RT_PRIMID */ WINED3DSPR_PRIMID,
1147 /* WINED3D_SM4_RT_DEPTHOUT */ WINED3DSPR_DEPTHOUT,
1148 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL,
1149 /* WINED3D_SM4_RT_RASTERIZER */ WINED3DSPR_RASTERIZER,
1150 /* WINED3D_SM4_RT_OMASK */ WINED3DSPR_SAMPLEMASK,
1151 /* WINED3D_SM5_RT_STREAM */ WINED3DSPR_STREAM,
1152 /* WINED3D_SM5_RT_FUNCTION_BODY */ WINED3DSPR_FUNCTIONBODY,
1153 /* UNKNOWN */ ~0u,
1154 /* WINED3D_SM5_RT_FUNCTION_POINTER */ WINED3DSPR_FUNCTIONPOINTER,
1155 /* UNKNOWN */ ~0u,
1156 /* UNKNOWN */ ~0u,
1157 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID */ WINED3DSPR_OUTPOINTID,
1158 /* WINED3D_SM5_RT_FORK_INSTANCE_ID */ WINED3DSPR_FORKINSTID,
1159 /* WINED3D_SM5_RT_JOIN_INSTANCE_ID */ WINED3DSPR_JOININSTID,
1160 /* WINED3D_SM5_RT_INPUT_CONTROL_POINT */ WINED3DSPR_INCONTROLPOINT,
1161 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT */ WINED3DSPR_OUTCONTROLPOINT,
1162 /* WINED3D_SM5_RT_PATCH_CONSTANT_DATA */ WINED3DSPR_PATCHCONST,
1163 /* WINED3D_SM5_RT_DOMAIN_LOCATION */ WINED3DSPR_TESSCOORD,
1164 /* UNKNOWN */ ~0u,
1165 /* WINED3D_SM5_RT_UAV */ WINED3DSPR_UAV,
1166 /* WINED3D_SM5_RT_SHARED_MEMORY */ WINED3DSPR_GROUPSHAREDMEM,
1167 /* WINED3D_SM5_RT_THREAD_ID */ WINED3DSPR_THREADID,
1168 /* WINED3D_SM5_RT_THREAD_GROUP_ID */ WINED3DSPR_THREADGROUPID,
1169 /* WINED3D_SM5_RT_LOCAL_THREAD_ID */ WINED3DSPR_LOCALTHREADID,
1170 /* WINED3D_SM5_RT_COVERAGE */ WINED3DSPR_COVERAGE,
1171 /* WINED3D_SM5_RT_LOCAL_THREAD_INDEX */ WINED3DSPR_LOCALTHREADINDEX,
1172 /* WINED3D_SM5_RT_GS_INSTANCE_ID */ WINED3DSPR_GSINSTID,
1173 /* WINED3D_SM5_RT_DEPTHOUT_GREATER_EQUAL */ WINED3DSPR_DEPTHOUTGE,
1174 /* WINED3D_SM5_RT_DEPTHOUT_LESS_EQUAL */ WINED3DSPR_DEPTHOUTLE,
1177 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
1179 unsigned int i;
1181 for (i = 0; i < ARRAY_SIZE(opcode_table); ++i)
1183 if (opcode == opcode_table[i].opcode) return &opcode_table[i];
1186 return NULL;
1189 static void map_register(const struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
1191 switch (priv->shader_version.type)
1193 case WINED3D_SHADER_TYPE_PIXEL:
1194 if (reg->type == WINED3DSPR_OUTPUT)
1196 unsigned int reg_idx = reg->idx[0].offset;
1198 if (reg_idx >= ARRAY_SIZE(priv->output_map))
1200 ERR("Invalid output index %u.\n", reg_idx);
1201 break;
1204 reg->type = WINED3DSPR_COLOROUT;
1205 reg->idx[0].offset = priv->output_map[reg_idx];
1207 break;
1209 default:
1210 break;
1214 static enum wined3d_data_type map_data_type(char t)
1216 switch (t)
1218 case 'f':
1219 return WINED3D_DATA_FLOAT;
1220 case 'i':
1221 return WINED3D_DATA_INT;
1222 case 'u':
1223 return WINED3D_DATA_UINT;
1224 case 'O':
1225 return WINED3D_DATA_OPAQUE;
1226 case 'R':
1227 return WINED3D_DATA_RESOURCE;
1228 case 'S':
1229 return WINED3D_DATA_SAMPLER;
1230 case 'U':
1231 return WINED3D_DATA_UAV;
1232 default:
1233 ERR("Invalid data type '%c'.\n", t);
1234 return WINED3D_DATA_FLOAT;
1238 static enum wined3d_shader_type wined3d_get_sm4_shader_type(const DWORD *byte_code, size_t byte_code_size)
1240 DWORD shader_type;
1242 if (byte_code_size / sizeof(*byte_code) < 1)
1244 WARN("Invalid byte code size %lu.\n", (long)byte_code_size);
1245 return WINED3D_SHADER_TYPE_INVALID;
1248 shader_type = byte_code[0] >> 16;
1249 switch (shader_type)
1251 case WINED3D_SM4_PS:
1252 return WINED3D_SHADER_TYPE_PIXEL;
1253 break;
1254 case WINED3D_SM4_VS:
1255 return WINED3D_SHADER_TYPE_VERTEX;
1256 break;
1257 case WINED3D_SM4_GS:
1258 return WINED3D_SHADER_TYPE_GEOMETRY;
1259 break;
1260 case WINED3D_SM5_HS:
1261 return WINED3D_SHADER_TYPE_HULL;
1262 break;
1263 case WINED3D_SM5_DS:
1264 return WINED3D_SHADER_TYPE_DOMAIN;
1265 break;
1266 case WINED3D_SM5_CS:
1267 return WINED3D_SHADER_TYPE_COMPUTE;
1268 break;
1269 default:
1270 FIXME("Unrecognised shader type %#x.\n", shader_type);
1271 return WINED3D_SHADER_TYPE_INVALID;
1275 static void *shader_sm4_init(const DWORD *byte_code, size_t byte_code_size,
1276 const struct wined3d_shader_signature *output_signature)
1278 DWORD version_token, token_count;
1279 struct wined3d_sm4_data *priv;
1280 unsigned int i;
1282 if (byte_code_size / sizeof(*byte_code) < 2)
1284 WARN("Invalid byte code size %lu.\n", (long)byte_code_size);
1285 return NULL;
1288 version_token = byte_code[0];
1289 TRACE("Version: 0x%08x.\n", version_token);
1290 token_count = byte_code[1];
1291 TRACE("Token count: %u.\n", token_count);
1293 if (token_count < 2 || byte_code_size / sizeof(*byte_code) < token_count)
1295 WARN("Invalid token count %u.\n", token_count);
1296 return NULL;
1299 if (!(priv = heap_alloc(sizeof(*priv))))
1301 ERR("Failed to allocate private data\n");
1302 return NULL;
1305 priv->start = &byte_code[2];
1306 priv->end = &byte_code[token_count];
1308 priv->shader_version.type = wined3d_get_sm4_shader_type(byte_code, byte_code_size);
1309 if (priv->shader_version.type == WINED3D_SHADER_TYPE_INVALID)
1311 heap_free(priv);
1312 return NULL;
1315 priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
1316 priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
1318 memset(priv->output_map, 0xff, sizeof(priv->output_map));
1319 for (i = 0; i < output_signature->element_count; ++i)
1321 struct wined3d_shader_signature_element *e = &output_signature->elements[i];
1323 if (priv->shader_version.type == WINED3D_SHADER_TYPE_PIXEL
1324 && _strnicmp(e->semantic_name, "SV_TARGET", -1))
1325 continue;
1326 if (e->register_idx >= ARRAY_SIZE(priv->output_map))
1328 WARN("Invalid output index %u.\n", e->register_idx);
1329 continue;
1332 priv->output_map[e->register_idx] = e->semantic_idx;
1335 list_init(&priv->src_free);
1336 list_init(&priv->src);
1338 return priv;
1341 static void shader_sm4_free(void *data)
1343 struct wined3d_shader_src_param_entry *e1, *e2;
1344 struct wined3d_sm4_data *priv = data;
1346 list_move_head(&priv->src_free, &priv->src);
1347 LIST_FOR_EACH_ENTRY_SAFE(e1, e2, &priv->src_free, struct wined3d_shader_src_param_entry, entry)
1349 heap_free(e1);
1351 heap_free(priv);
1354 static struct wined3d_shader_src_param *get_src_param(struct wined3d_sm4_data *priv)
1356 struct wined3d_shader_src_param_entry *e;
1357 struct list *elem;
1359 if (!list_empty(&priv->src_free))
1361 elem = list_head(&priv->src_free);
1362 list_remove(elem);
1364 else
1366 if (!(e = heap_alloc(sizeof(*e))))
1367 return NULL;
1368 elem = &e->entry;
1371 list_add_tail(&priv->src, elem);
1372 e = LIST_ENTRY(elem, struct wined3d_shader_src_param_entry, entry);
1373 return &e->param;
1376 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
1378 struct wined3d_sm4_data *priv = data;
1380 *ptr = priv->start;
1381 *shader_version = priv->shader_version;
1384 static BOOL shader_sm4_read_reg_idx(struct wined3d_sm4_data *priv, const DWORD **ptr, const DWORD *end,
1385 DWORD addressing, struct wined3d_shader_register_index *reg_idx)
1387 if (addressing & WINED3D_SM4_ADDRESSING_RELATIVE)
1389 struct wined3d_shader_src_param *rel_addr = get_src_param(priv);
1391 if (!(reg_idx->rel_addr = rel_addr))
1393 ERR("Failed to get src param for relative addressing.\n");
1394 return FALSE;
1397 if (addressing & WINED3D_SM4_ADDRESSING_OFFSET)
1398 reg_idx->offset = *(*ptr)++;
1399 else
1400 reg_idx->offset = 0;
1401 shader_sm4_read_src_param(priv, ptr, end, WINED3D_DATA_INT, rel_addr);
1403 else
1405 reg_idx->rel_addr = NULL;
1406 reg_idx->offset = *(*ptr)++;
1409 return TRUE;
1412 static BOOL shader_sm4_read_param(struct wined3d_sm4_data *priv, const DWORD **ptr, const DWORD *end,
1413 enum wined3d_data_type data_type, struct wined3d_shader_register *param,
1414 enum wined3d_shader_src_modifier *modifier)
1416 enum wined3d_sm4_register_type register_type;
1417 DWORD token, order;
1419 if (*ptr >= end)
1421 WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
1422 return FALSE;
1424 token = *(*ptr)++;
1426 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
1427 if (register_type >= ARRAY_SIZE(register_type_table)
1428 || register_type_table[register_type] == ~0u)
1430 FIXME("Unhandled register type %#x.\n", register_type);
1431 param->type = WINED3DSPR_TEMP;
1433 else
1435 param->type = register_type_table[register_type];
1437 param->data_type = data_type;
1439 if (token & WINED3D_SM4_REGISTER_MODIFIER)
1441 DWORD m;
1443 if (*ptr >= end)
1445 WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
1446 return FALSE;
1448 m = *(*ptr)++;
1450 switch (m)
1452 case 0x41:
1453 *modifier = WINED3DSPSM_NEG;
1454 break;
1456 case 0x81:
1457 *modifier = WINED3DSPSM_ABS;
1458 break;
1460 case 0xc1:
1461 *modifier = WINED3DSPSM_ABSNEG;
1462 break;
1464 default:
1465 FIXME("Skipping modifier 0x%08x.\n", m);
1466 case 0x01:
1467 *modifier = WINED3DSPSM_NONE;
1468 break;
1471 else
1473 *modifier = WINED3DSPSM_NONE;
1476 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
1478 if (order < 1)
1479 param->idx[0].offset = ~0U;
1480 else
1482 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK0) >> WINED3D_SM4_ADDRESSING_SHIFT0;
1483 if (!(shader_sm4_read_reg_idx(priv, ptr, end, addressing, &param->idx[0])))
1485 ERR("Failed to read register index.\n");
1486 return FALSE;
1490 if (order < 2)
1491 param->idx[1].offset = ~0U;
1492 else
1494 DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK1) >> WINED3D_SM4_ADDRESSING_SHIFT1;
1495 if (!(shader_sm4_read_reg_idx(priv, ptr, end, addressing, &param->idx[1])))
1497 ERR("Failed to read register index.\n");
1498 return FALSE;
1502 if (order > 2)
1503 FIXME("Unhandled order %u.\n", order);
1505 if (register_type == WINED3D_SM4_RT_IMMCONST)
1507 enum wined3d_sm4_dimension dimension = (token & WINED3D_SM4_DIMENSION_MASK) >> WINED3D_SM4_DIMENSION_SHIFT;
1509 switch (dimension)
1511 case WINED3D_SM4_DIMENSION_SCALAR:
1512 param->immconst_type = WINED3D_IMMCONST_SCALAR;
1513 if (end - *ptr < 1)
1515 WARN("Invalid ptr %p, end %p.\n", *ptr, end);
1516 return FALSE;
1518 memcpy(param->u.immconst_data, *ptr, 1 * sizeof(DWORD));
1519 *ptr += 1;
1520 break;
1522 case WINED3D_SM4_DIMENSION_VEC4:
1523 param->immconst_type = WINED3D_IMMCONST_VEC4;
1524 if (end - *ptr < 4)
1526 WARN("Invalid ptr %p, end %p.\n", *ptr, end);
1527 return FALSE;
1529 memcpy(param->u.immconst_data, *ptr, 4 * sizeof(DWORD));
1530 *ptr += 4;
1531 break;
1533 default:
1534 FIXME("Unhandled dimension %#x.\n", dimension);
1535 break;
1539 map_register(priv, param);
1541 return TRUE;
1544 static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr, const DWORD *end,
1545 enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param)
1547 DWORD token;
1549 if (*ptr >= end)
1551 WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
1552 return FALSE;
1554 token = **ptr;
1556 if (!shader_sm4_read_param(priv, ptr, end, data_type, &src_param->reg, &src_param->modifiers))
1558 ERR("Failed to read parameter.\n");
1559 return FALSE;
1562 if (src_param->reg.type == WINED3DSPR_IMMCONST)
1564 src_param->swizzle = WINED3DSP_NOSWIZZLE;
1566 else
1568 enum wined3d_sm4_swizzle_type swizzle_type =
1569 (token & WINED3D_SM4_SWIZZLE_TYPE_MASK) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT;
1571 switch (swizzle_type)
1573 case WINED3D_SM4_SWIZZLE_NONE:
1574 src_param->swizzle = WINED3DSP_NOSWIZZLE;
1575 break;
1577 case WINED3D_SM4_SWIZZLE_SCALAR:
1578 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
1579 src_param->swizzle = (src_param->swizzle & 0x3) * 0x55;
1580 break;
1582 case WINED3D_SM4_SWIZZLE_VEC4:
1583 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
1584 break;
1586 default:
1587 FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
1588 break;
1592 return TRUE;
1595 static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr, const DWORD *end,
1596 enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param)
1598 enum wined3d_shader_src_modifier modifier;
1599 DWORD token;
1601 if (*ptr >= end)
1603 WARN("Invalid ptr %p >= end %p.\n", *ptr, end);
1604 return FALSE;
1606 token = **ptr;
1608 if (!shader_sm4_read_param(priv, ptr, end, data_type, &dst_param->reg, &modifier))
1610 ERR("Failed to read parameter.\n");
1611 return FALSE;
1614 if (modifier != WINED3DSPSM_NONE)
1616 ERR("Invalid source modifier %#x on destination register.\n", modifier);
1617 return FALSE;
1620 dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
1621 dst_param->modifiers = 0;
1622 dst_param->shift = 0;
1624 return TRUE;
1627 static void shader_sm4_read_instruction_modifier(DWORD modifier, struct wined3d_shader_instruction *ins)
1629 enum wined3d_sm4_instruction_modifier modifier_type = modifier & WINED3D_SM4_MODIFIER_MASK;
1631 switch (modifier_type)
1633 case WINED3D_SM4_MODIFIER_AOFFIMMI:
1635 static const DWORD recognized_bits = WINED3D_SM4_INSTRUCTION_MODIFIER
1636 | WINED3D_SM4_MODIFIER_MASK
1637 | WINED3D_SM4_AOFFIMMI_U_MASK
1638 | WINED3D_SM4_AOFFIMMI_V_MASK
1639 | WINED3D_SM4_AOFFIMMI_W_MASK;
1641 /* Bit fields are used for sign extension. */
1642 struct
1644 int u : 4;
1645 int v : 4;
1646 int w : 4;
1647 } aoffimmi;
1649 if (modifier & ~recognized_bits)
1650 FIXME("Unhandled instruction modifier %#x.\n", modifier);
1652 aoffimmi.u = (modifier & WINED3D_SM4_AOFFIMMI_U_MASK) >> WINED3D_SM4_AOFFIMMI_U_SHIFT;
1653 aoffimmi.v = (modifier & WINED3D_SM4_AOFFIMMI_V_MASK) >> WINED3D_SM4_AOFFIMMI_V_SHIFT;
1654 aoffimmi.w = (modifier & WINED3D_SM4_AOFFIMMI_W_MASK) >> WINED3D_SM4_AOFFIMMI_W_SHIFT;
1655 ins->texel_offset.u = aoffimmi.u;
1656 ins->texel_offset.v = aoffimmi.v;
1657 ins->texel_offset.w = aoffimmi.w;
1658 break;
1661 case WINED3D_SM5_MODIFIER_DATA_TYPE:
1663 DWORD components = (modifier & WINED3D_SM5_MODIFIER_DATA_TYPE_MASK) >> WINED3D_SM5_MODIFIER_DATA_TYPE_SHIFT;
1664 enum wined3d_sm4_data_type data_type = components & 0xf;
1666 if ((components & 0xfff0) != (components & 0xf) * 0x1110)
1667 FIXME("Components (%#x) have different data types.\n", components);
1668 ins->resource_data_type = data_type_table[data_type];
1669 break;
1672 case WINED3D_SM5_MODIFIER_RESOURCE_TYPE:
1674 enum wined3d_sm4_resource_type resource_type
1675 = (modifier & WINED3D_SM5_MODIFIER_RESOURCE_TYPE_MASK) >> WINED3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT;
1677 ins->resource_type = resource_type_table[resource_type];
1678 break;
1681 default:
1682 FIXME("Unhandled instruction modifier %#x.\n", modifier);
1686 static void shader_sm4_read_instruction(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins)
1688 const struct wined3d_sm4_opcode_info *opcode_info;
1689 DWORD opcode_token, opcode, previous_token;
1690 struct wined3d_sm4_data *priv = data;
1691 unsigned int i, len;
1692 SIZE_T remaining;
1693 const DWORD *p;
1694 DWORD precise;
1696 list_move_head(&priv->src_free, &priv->src);
1698 if (*ptr >= priv->end)
1700 WARN("End of byte-code, failed to read opcode.\n");
1701 goto fail;
1703 remaining = priv->end - *ptr;
1705 opcode_token = *(*ptr)++;
1706 opcode = opcode_token & WINED3D_SM4_OPCODE_MASK;
1708 len = ((opcode_token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT);
1709 if (!len)
1711 if (remaining < 2)
1713 WARN("End of byte-code, failed to read length token.\n");
1714 goto fail;
1716 len = **ptr;
1718 if (!len || remaining < len)
1720 WARN("Read invalid length %u (remaining %lu).\n", len, remaining);
1721 goto fail;
1723 --len;
1725 if (TRACE_ON(d3d_bytecode))
1727 TRACE_(d3d_bytecode)("[ %08x ", opcode_token);
1728 for (i = 0; i < len; ++i)
1730 TRACE_(d3d_bytecode)("%08x ", (*ptr)[i]);
1732 TRACE_(d3d_bytecode)("]\n");
1735 if (!(opcode_info = get_opcode_info(opcode)))
1737 FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode, opcode_token);
1738 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1739 *ptr += len;
1740 return;
1743 ins->handler_idx = opcode_info->handler_idx;
1744 ins->flags = 0;
1745 ins->coissue = 0;
1746 ins->predicate = NULL;
1747 ins->dst_count = strlen(opcode_info->dst_info);
1748 ins->dst = priv->dst_param;
1749 ins->src_count = strlen(opcode_info->src_info);
1750 ins->src = priv->src_param;
1751 ins->resource_type = WINED3D_SHADER_RESOURCE_NONE;
1752 ins->resource_data_type = WINED3D_DATA_FLOAT;
1753 memset(&ins->texel_offset, 0, sizeof(ins->texel_offset));
1755 p = *ptr;
1756 *ptr += len;
1758 if (opcode_info->read_opcode_func)
1760 opcode_info->read_opcode_func(ins, opcode, opcode_token, p, len, priv);
1762 else
1764 enum wined3d_shader_dst_modifier instruction_dst_modifier = WINED3DSPDM_NONE;
1766 previous_token = opcode_token;
1767 while (previous_token & WINED3D_SM4_INSTRUCTION_MODIFIER && p != *ptr)
1768 shader_sm4_read_instruction_modifier(previous_token = *p++, ins);
1770 ins->flags = (opcode_token & WINED3D_SM4_INSTRUCTION_FLAGS_MASK) >> WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT;
1771 if (ins->flags & WINED3D_SM4_INSTRUCTION_FLAG_SATURATE)
1773 ins->flags &= ~WINED3D_SM4_INSTRUCTION_FLAG_SATURATE;
1774 instruction_dst_modifier = WINED3DSPDM_SATURATE;
1776 precise = (opcode_token & WINED3D_SM5_PRECISE_MASK) >> WINED3D_SM5_PRECISE_SHIFT;
1777 ins->flags |= precise << WINED3DSI_PRECISE_SHIFT;
1779 for (i = 0; i < ins->dst_count; ++i)
1781 if (!(shader_sm4_read_dst_param(priv, &p, *ptr, map_data_type(opcode_info->dst_info[i]),
1782 &priv->dst_param[i])))
1784 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1785 return;
1787 priv->dst_param[i].modifiers |= instruction_dst_modifier;
1790 for (i = 0; i < ins->src_count; ++i)
1792 if (!(shader_sm4_read_src_param(priv, &p, *ptr, map_data_type(opcode_info->src_info[i]),
1793 &priv->src_param[i])))
1795 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1796 return;
1801 return;
1803 fail:
1804 *ptr = priv->end;
1805 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
1806 return;
1809 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
1811 struct wined3d_sm4_data *priv = data;
1812 return *ptr == priv->end;
1815 const struct wined3d_shader_frontend sm4_shader_frontend =
1817 shader_sm4_init,
1818 shader_sm4_free,
1819 shader_sm4_read_header,
1820 shader_sm4_read_instruction,
1821 shader_sm4_is_end,
/* FOURCC tags used by the DXBC parser: TAG_DXBC identifies the container
 * itself, the others identify individual chunks. */
#define TAG_AON9    WINEMAKEFOURCC('A', 'o', 'n', '9')
#define TAG_DXBC    WINEMAKEFOURCC('D', 'X', 'B', 'C')
#define TAG_ISG1    WINEMAKEFOURCC('I', 'S', 'G', '1')
#define TAG_ISGN    WINEMAKEFOURCC('I', 'S', 'G', 'N')
#define TAG_OSG1    WINEMAKEFOURCC('O', 'S', 'G', '1')
#define TAG_OSG5    WINEMAKEFOURCC('O', 'S', 'G', '5')
#define TAG_OSGN    WINEMAKEFOURCC('O', 'S', 'G', 'N')
#define TAG_PCSG    WINEMAKEFOURCC('P', 'C', 'S', 'G')
#define TAG_PSG1    WINEMAKEFOURCC('P', 'S', 'G', '1')
#define TAG_SHDR    WINEMAKEFOURCC('S', 'H', 'D', 'R')
#define TAG_SHEX    WINEMAKEFOURCC('S', 'H', 'E', 'X')
1836 struct aon9_header
1838 DWORD chunk_size;
1839 DWORD shader_version;
1840 DWORD unknown;
1841 DWORD byte_code_offset;
/* State handed to shader_dxbc_chunk_handler() through parse_dxbc(). */
struct shader_handler_context
{
    /* Shader receiving the parsed signatures and the byte code pointer. */
    struct wined3d_shader *shader;
    /* Written with the byte code format of the code chunk that was picked. */
    enum wined3d_shader_byte_code_format *format;
    /* Below 4, SM4+ code and input/output signatures are skipped and Aon9
     * code is used; otherwise Aon9 code is skipped. */
    unsigned int max_version;
};
1851 static void read_dword(const char **ptr, DWORD *d)
1853 memcpy(d, *ptr, sizeof(*d));
1854 *ptr += sizeof(*d);
1857 static BOOL require_space(size_t offset, size_t count, size_t size, size_t data_size)
1859 return !count || (data_size - offset) / count >= size;
1862 static void skip_dword_unknown(const char **ptr, unsigned int count)
1864 unsigned int i;
1865 DWORD d;
1867 WARN("Skipping %u unknown DWORDs:\n", count);
1868 for (i = 0; i < count; ++i)
1870 read_dword(ptr, &d);
1871 WARN("\t0x%08x\n", d);
1875 static HRESULT parse_dxbc(const char *data, SIZE_T data_size,
1876 HRESULT (*chunk_handler)(const char *data, DWORD data_size, DWORD tag, void *ctx), void *ctx)
1878 const char *ptr = data;
1879 HRESULT hr = S_OK;
1880 DWORD chunk_count;
1881 DWORD total_size;
1882 unsigned int i;
1883 DWORD version;
1884 DWORD tag;
1886 read_dword(&ptr, &tag);
1887 TRACE("tag: %s.\n", debugstr_an((const char *)&tag, 4));
1889 if (tag != TAG_DXBC)
1891 WARN("Wrong tag.\n");
1892 return E_INVALIDARG;
1895 WARN("Ignoring DXBC checksum.\n");
1896 skip_dword_unknown(&ptr, 4);
1898 read_dword(&ptr, &version);
1899 TRACE("version: %#x.\n", version);
1900 if (version != 0x00000001)
1902 WARN("Got unexpected DXBC version %#x.\n", version);
1903 return E_INVALIDARG;
1906 read_dword(&ptr, &total_size);
1907 TRACE("total size: %#x\n", total_size);
1909 read_dword(&ptr, &chunk_count);
1910 TRACE("chunk count: %#x\n", chunk_count);
1912 for (i = 0; i < chunk_count; ++i)
1914 DWORD chunk_tag, chunk_size;
1915 const char *chunk_ptr;
1916 DWORD chunk_offset;
1918 read_dword(&ptr, &chunk_offset);
1919 TRACE("chunk %u at offset %#x\n", i, chunk_offset);
1921 if (chunk_offset >= data_size || !require_space(chunk_offset, 2, sizeof(DWORD), data_size))
1923 WARN("Invalid chunk offset %#x (data size %#lx).\n", chunk_offset, data_size);
1924 return E_FAIL;
1927 chunk_ptr = data + chunk_offset;
1929 read_dword(&chunk_ptr, &chunk_tag);
1930 read_dword(&chunk_ptr, &chunk_size);
1932 if (!require_space(chunk_ptr - data, 1, chunk_size, data_size))
1934 WARN("Invalid chunk size %#x (data size %#lx, chunk offset %#x).\n",
1935 chunk_size, data_size, chunk_offset);
1936 return E_FAIL;
1939 if (FAILED(hr = chunk_handler(chunk_ptr, chunk_size, chunk_tag, ctx)))
1940 break;
1943 return hr;
1946 static const char *shader_get_string(const char *data, size_t data_size, DWORD offset)
1948 if (offset >= data_size)
1950 WARN("Invalid offset %#x (data size %#lx).\n", offset, (long)data_size);
1951 return NULL;
1954 if (!memchr( data + offset, 0, data_size - offset ))
1955 return NULL;
1957 return data + offset;
1960 static HRESULT shader_parse_signature(DWORD tag, const char *data, DWORD data_size,
1961 struct wined3d_shader_signature *s)
1963 struct wined3d_shader_signature_element *e;
1964 bool has_stream_index, has_min_precision;
1965 const char *ptr = data;
1966 unsigned int i;
1967 DWORD count;
1969 if (!require_space(0, 2, sizeof(DWORD), data_size))
1971 WARN("Invalid data size %#x.\n", data_size);
1972 return E_INVALIDARG;
1975 read_dword(&ptr, &count);
1976 TRACE("%u elements.\n", count);
1978 skip_dword_unknown(&ptr, 1); /* It seems to always be 0x00000008. */
1980 if (!require_space(ptr - data, count, 6 * sizeof(DWORD), data_size))
1982 WARN("Invalid count %#x (data size %#x).\n", count, data_size);
1983 return E_INVALIDARG;
1986 if (!(e = heap_calloc(count, sizeof(*e))))
1988 ERR("Failed to allocate input signature memory.\n");
1989 return E_OUTOFMEMORY;
1992 has_min_precision = tag == TAG_OSG1 || tag == TAG_PSG1 || tag == TAG_ISG1;
1993 has_stream_index = tag == TAG_OSG5 || has_min_precision;
1995 for (i = 0; i < count; ++i)
1997 DWORD name_offset;
1999 if (has_stream_index)
2000 read_dword(&ptr, &e[i].stream_idx);
2001 else
2002 e[i].stream_idx = 0;
2003 read_dword(&ptr, &name_offset);
2004 if (!(e[i].semantic_name = shader_get_string(data, data_size, name_offset)))
2006 WARN("Invalid name offset %#x (data size %#x).\n", name_offset, data_size);
2007 heap_free(e);
2008 return E_INVALIDARG;
2010 read_dword(&ptr, &e[i].semantic_idx);
2011 read_dword(&ptr, &e[i].sysval_semantic);
2012 read_dword(&ptr, &e[i].component_type);
2013 read_dword(&ptr, &e[i].register_idx);
2014 read_dword(&ptr, &e[i].mask);
2016 if (has_min_precision)
2017 read_dword(&ptr, &e[i].min_precision);
2018 else
2019 e[i].min_precision = 0;
2021 TRACE("Stream: %u, semantic: %s, semantic idx: %u, sysval_semantic %#x, "
2022 "type %u, register idx: %u, use_mask %#x, input_mask %#x, min_precision %u.\n",
2023 e[i].stream_idx, debugstr_a(e[i].semantic_name), e[i].semantic_idx, e[i].sysval_semantic,
2024 e[i].component_type, e[i].register_idx, (e[i].mask >> 8) & 0xff, e[i].mask & 0xff, e[i].min_precision);
2027 s->elements = e;
2028 s->element_count = count;
2030 return S_OK;
2033 static HRESULT shader_dxbc_chunk_handler(const char *data, DWORD data_size, DWORD tag, void *context)
2035 struct shader_handler_context *ctx = context;
2036 struct wined3d_shader *shader = ctx->shader;
2037 HRESULT hr;
2039 switch (tag)
2041 case TAG_ISGN:
2042 case TAG_ISG1:
2043 if (ctx->max_version < 4)
2045 TRACE("Skipping shader input signature.\n");
2046 break;
2048 if (shader->input_signature.elements)
2050 FIXME("Multiple input signatures.\n");
2051 break;
2053 if (FAILED(hr = shader_parse_signature(tag, data, data_size, &shader->input_signature)))
2054 return hr;
2055 break;
2057 case TAG_OSGN:
2058 case TAG_OSG1:
2059 case TAG_OSG5:
2060 if (ctx->max_version < 4)
2062 TRACE("Skipping shader output signature.\n");
2063 break;
2065 if (shader->output_signature.elements)
2067 FIXME("Multiple output signatures.\n");
2068 break;
2070 if (FAILED(hr = shader_parse_signature(tag, data, data_size, &shader->output_signature)))
2071 return hr;
2072 break;
2074 case TAG_PCSG:
2075 case TAG_PSG1:
2076 if (shader->patch_constant_signature.elements)
2078 FIXME("Multiple patch constant signatures.\n");
2079 break;
2081 if (FAILED(hr = shader_parse_signature(tag, data, data_size, &shader->patch_constant_signature)))
2082 return hr;
2083 break;
2085 case TAG_SHDR:
2086 case TAG_SHEX:
2087 if (ctx->max_version < 4)
2089 TRACE("Skipping SM4+ shader.\n");
2090 break;
2092 if (shader->function)
2093 FIXME("Multiple shader code chunks.\n");
2094 shader->function = (const DWORD *)data;
2095 shader->functionLength = data_size;
2096 *ctx->format = WINED3D_SHADER_BYTE_CODE_FORMAT_SM4;
2097 break;
2099 case TAG_AON9:
2100 if (ctx->max_version < 4)
2102 const struct aon9_header *header = (const struct aon9_header *)data;
2103 unsigned int unknown_dword_count;
2104 const char *byte_code;
2106 if (data_size < sizeof(*header))
2108 WARN("Invalid Aon9 data size %#x.\n", data_size);
2109 return E_FAIL;
2111 byte_code = data + header->byte_code_offset;
2112 unknown_dword_count = (header->byte_code_offset - sizeof(*header)) / sizeof(DWORD);
2114 if (data_size - 2 * sizeof(DWORD) < header->byte_code_offset)
2116 WARN("Invalid byte code offset %#x (size %#x).\n", header->byte_code_offset, data_size);
2117 return E_FAIL;
2119 FIXME("Skipping %u unknown DWORDs.\n", unknown_dword_count);
2121 if (shader->function)
2122 FIXME("Multiple shader code chunks.\n");
2123 shader->function = (const DWORD *)byte_code;
2124 shader->functionLength = data_size - header->byte_code_offset;
2125 *ctx->format = WINED3D_SHADER_BYTE_CODE_FORMAT_SM1;
2126 TRACE("Feature level 9 shader version 0%08x, 0%08x.\n",
2127 header->shader_version, *shader->function);
2129 else
2131 TRACE("Skipping feature level 9 shader code.\n");
2133 break;
2135 default:
2136 TRACE("Skipping chunk %s.\n", debugstr_an((const char *)&tag, 4));
2137 break;
2140 return S_OK;
2143 HRESULT shader_extract_from_dxbc(struct wined3d_shader *shader,
2144 unsigned int max_shader_version, enum wined3d_shader_byte_code_format *format)
2146 struct shader_handler_context ctx;
2147 HRESULT hr;
2149 ctx.shader = shader;
2150 ctx.format = format;
2151 ctx.max_version = max_shader_version;
2153 hr = parse_dxbc(shader->byte_code, shader->byte_code_size, shader_dxbc_chunk_handler, &ctx);
2154 if (!shader->function)
2155 hr = E_INVALIDARG;
2157 if (FAILED(hr))
2158 WARN("Failed to parse DXBC, hr %#x.\n", hr);
2160 return hr;
2163 static HRESULT shader_isgn_chunk_handler(const char *data, DWORD data_size, DWORD tag, void *ctx)
2165 struct wined3d_shader_signature *is = ctx;
2167 if (tag != TAG_ISGN)
2168 return S_OK;
2170 if (is->elements)
2172 FIXME("Multiple shader signatures.\n");
2173 return S_OK;
2176 return shader_parse_signature(tag, data, data_size, is);
2179 HRESULT CDECL wined3d_extract_shader_input_signature_from_dxbc(struct wined3d_shader_signature *signature,
2180 const void *code, SIZE_T code_size)
2182 memset(signature, 0, sizeof(*signature));
2183 return parse_dxbc(code, code_size, shader_isgn_chunk_handler, signature);