/*
 * Copyright 2009 Henri Verbeet for CodeWeavers
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
 */
21 #include "wined3d_private.h"
/* Wine debug channel declarations for this file. */
WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode);
/* Bit-field masks and shifts used when decoding SM4/SM5 tokens.
 *
 * Every shifted *_MASK is already positioned at its matching *_SHIFT, so a
 * field is extracted as (token & X_MASK) >> X_SHIFT. Several fields share
 * the same bit position; which one applies depends on the opcode being
 * decoded. */
#define WINED3D_SM4_INSTRUCTION_MODIFIER        (0x1u << 31)

#define WINED3D_SM4_MODIFIER_MASK               0x3fu

#define WINED3D_SM5_MODIFIER_DATA_TYPE_SHIFT    6
#define WINED3D_SM5_MODIFIER_DATA_TYPE_MASK     (0xffffu << WINED3D_SM5_MODIFIER_DATA_TYPE_SHIFT)

#define WINED3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT 6
#define WINED3D_SM5_MODIFIER_RESOURCE_TYPE_MASK (0xfu << WINED3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT)

#define WINED3D_SM4_AOFFIMMI_U_SHIFT            9
#define WINED3D_SM4_AOFFIMMI_U_MASK             (0xfu << WINED3D_SM4_AOFFIMMI_U_SHIFT)
#define WINED3D_SM4_AOFFIMMI_V_SHIFT            13
#define WINED3D_SM4_AOFFIMMI_V_MASK             (0xfu << WINED3D_SM4_AOFFIMMI_V_SHIFT)
#define WINED3D_SM4_AOFFIMMI_W_SHIFT            17
#define WINED3D_SM4_AOFFIMMI_W_MASK             (0xfu << WINED3D_SM4_AOFFIMMI_W_SHIFT)

#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0x1fu << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

#define WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT     11
#define WINED3D_SM4_INSTRUCTION_FLAGS_MASK      (0x7u << WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT)

#define WINED3D_SM4_RESOURCE_TYPE_SHIFT         11
#define WINED3D_SM4_RESOURCE_TYPE_MASK          (0xfu << WINED3D_SM4_RESOURCE_TYPE_SHIFT)

#define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT        11
#define WINED3D_SM4_PRIMITIVE_TYPE_MASK         (0x3fu << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)

#define WINED3D_SM4_INDEX_TYPE_SHIFT            11
#define WINED3D_SM4_INDEX_TYPE_MASK             (0x1u << WINED3D_SM4_INDEX_TYPE_SHIFT)

#define WINED3D_SM4_SAMPLER_MODE_SHIFT          11
#define WINED3D_SM4_SAMPLER_MODE_MASK           (0xfu << WINED3D_SM4_SAMPLER_MODE_SHIFT)

#define WINED3D_SM4_SHADER_DATA_TYPE_SHIFT      11
#define WINED3D_SM4_SHADER_DATA_TYPE_MASK       (0xfu << WINED3D_SM4_SHADER_DATA_TYPE_SHIFT)

#define WINED3D_SM4_INTERPOLATION_MODE_SHIFT    11
#define WINED3D_SM4_INTERPOLATION_MODE_MASK     (0xfu << WINED3D_SM4_INTERPOLATION_MODE_SHIFT)

#define WINED3D_SM4_GLOBAL_FLAGS_SHIFT          11
#define WINED3D_SM4_GLOBAL_FLAGS_MASK           (0xffu << WINED3D_SM4_GLOBAL_FLAGS_SHIFT)

#define WINED3D_SM5_PRECISE_SHIFT               19
#define WINED3D_SM5_PRECISE_MASK                (0xfu << WINED3D_SM5_PRECISE_SHIFT)

#define WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT   11
#define WINED3D_SM5_CONTROL_POINT_COUNT_MASK    (0xffu << WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT)

/* The function pointer array size lives in the high 16 bits of its token and
 * the table count in the low 16 bits, hence a shift without a mask and a mask
 * without a shift. */
#define WINED3D_SM5_FP_ARRAY_SIZE_SHIFT         16
#define WINED3D_SM5_FP_TABLE_COUNT_MASK         0xffffu

#define WINED3D_SM5_UAV_FLAGS_SHIFT             15
#define WINED3D_SM5_UAV_FLAGS_MASK              (0x1ffu << WINED3D_SM5_UAV_FLAGS_SHIFT)

#define WINED3D_SM5_SYNC_FLAGS_SHIFT            11
#define WINED3D_SM5_SYNC_FLAGS_MASK             (0xffu << WINED3D_SM5_SYNC_FLAGS_SHIFT)

#define WINED3D_SM5_TESSELLATOR_SHIFT           11
#define WINED3D_SM5_TESSELLATOR_MASK            (0xfu << WINED3D_SM5_TESSELLATOR_SHIFT)

#define WINED3D_SM4_OPCODE_MASK                 0xff

#define WINED3D_SM4_REGISTER_MODIFIER           (0x1u << 31)

#define WINED3D_SM4_ADDRESSING_SHIFT1           25
#define WINED3D_SM4_ADDRESSING_MASK1            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT1)

#define WINED3D_SM4_ADDRESSING_SHIFT0           22
#define WINED3D_SM4_ADDRESSING_MASK0            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT0)

#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3u << WINED3D_SM4_REGISTER_ORDER_SHIFT)

#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xffu << WINED3D_SM4_REGISTER_TYPE_SHIFT)

#define WINED3D_SM4_SWIZZLE_TYPE_SHIFT          2
#define WINED3D_SM4_SWIZZLE_TYPE_MASK           (0x3u << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)

#define WINED3D_SM4_DIMENSION_SHIFT             0
#define WINED3D_SM4_DIMENSION_MASK              (0x3u << WINED3D_SM4_DIMENSION_SHIFT)

#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xfu << WINED3D_SM4_WRITEMASK_SHIFT)

#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xffu << WINED3D_SM4_SWIZZLE_SHIFT)

/* The major version is the second-lowest nibble, the minor the lowest. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)

#define WINED3D_SM4_ADDRESSING_RELATIVE         0x2
#define WINED3D_SM4_ADDRESSING_OFFSET           0x1

#define WINED3D_SM4_INSTRUCTION_FLAG_SATURATE   0x4

#define WINED3D_SM4_CONDITIONAL_NZ              (0x1u << 18)
/* Numeric SM4 / SM5 opcode values. Gaps in the numbering are values this
 * enumeration does not name. */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD                              = 0x00,
    WINED3D_SM4_OP_AND                              = 0x01,
    WINED3D_SM4_OP_BREAK                            = 0x02,
    WINED3D_SM4_OP_BREAKC                           = 0x03,
    WINED3D_SM4_OP_CASE                             = 0x06,
    WINED3D_SM4_OP_CONTINUE                         = 0x07,
    WINED3D_SM4_OP_CONTINUEC                        = 0x08,
    WINED3D_SM4_OP_CUT                              = 0x09,
    WINED3D_SM4_OP_DEFAULT                          = 0x0a,
    WINED3D_SM4_OP_DERIV_RTX                        = 0x0b,
    WINED3D_SM4_OP_DERIV_RTY                        = 0x0c,
    WINED3D_SM4_OP_DISCARD                          = 0x0d,
    WINED3D_SM4_OP_DIV                              = 0x0e,
    WINED3D_SM4_OP_DP2                              = 0x0f,
    WINED3D_SM4_OP_DP3                              = 0x10,
    WINED3D_SM4_OP_DP4                              = 0x11,
    WINED3D_SM4_OP_ELSE                             = 0x12,
    WINED3D_SM4_OP_EMIT                             = 0x13,
    WINED3D_SM4_OP_ENDIF                            = 0x15,
    WINED3D_SM4_OP_ENDLOOP                          = 0x16,
    WINED3D_SM4_OP_ENDSWITCH                        = 0x17,
    WINED3D_SM4_OP_EQ                               = 0x18,
    WINED3D_SM4_OP_EXP                              = 0x19,
    WINED3D_SM4_OP_FRC                              = 0x1a,
    WINED3D_SM4_OP_FTOI                             = 0x1b,
    WINED3D_SM4_OP_FTOU                             = 0x1c,
    WINED3D_SM4_OP_GE                               = 0x1d,
    WINED3D_SM4_OP_IADD                             = 0x1e,
    WINED3D_SM4_OP_IF                               = 0x1f,
    WINED3D_SM4_OP_IEQ                              = 0x20,
    WINED3D_SM4_OP_IGE                              = 0x21,
    WINED3D_SM4_OP_ILT                              = 0x22,
    WINED3D_SM4_OP_IMAD                             = 0x23,
    WINED3D_SM4_OP_IMAX                             = 0x24,
    WINED3D_SM4_OP_IMIN                             = 0x25,
    WINED3D_SM4_OP_IMUL                             = 0x26,
    WINED3D_SM4_OP_INE                              = 0x27,
    WINED3D_SM4_OP_INEG                             = 0x28,
    WINED3D_SM4_OP_ISHL                             = 0x29,
    WINED3D_SM4_OP_ISHR                             = 0x2a,
    WINED3D_SM4_OP_ITOF                             = 0x2b,
    WINED3D_SM4_OP_LABEL                            = 0x2c,
    WINED3D_SM4_OP_LD                               = 0x2d,
    WINED3D_SM4_OP_LD2DMS                           = 0x2e,
    WINED3D_SM4_OP_LOG                              = 0x2f,
    WINED3D_SM4_OP_LOOP                             = 0x30,
    WINED3D_SM4_OP_LT                               = 0x31,
    WINED3D_SM4_OP_MAD                              = 0x32,
    WINED3D_SM4_OP_MIN                              = 0x33,
    WINED3D_SM4_OP_MAX                              = 0x34,
    WINED3D_SM4_OP_SHADER_DATA                      = 0x35,
    WINED3D_SM4_OP_MOV                              = 0x36,
    WINED3D_SM4_OP_MOVC                             = 0x37,
    WINED3D_SM4_OP_MUL                              = 0x38,
    WINED3D_SM4_OP_NE                               = 0x39,
    WINED3D_SM4_OP_NOP                              = 0x3a,
    WINED3D_SM4_OP_NOT                              = 0x3b,
    WINED3D_SM4_OP_OR                               = 0x3c,
    WINED3D_SM4_OP_RESINFO                          = 0x3d,
    WINED3D_SM4_OP_RET                              = 0x3e,
    WINED3D_SM4_OP_RETC                             = 0x3f,
    WINED3D_SM4_OP_ROUND_NE                         = 0x40,
    WINED3D_SM4_OP_ROUND_NI                         = 0x41,
    WINED3D_SM4_OP_ROUND_PI                         = 0x42,
    WINED3D_SM4_OP_ROUND_Z                          = 0x43,
    WINED3D_SM4_OP_RSQ                              = 0x44,
    WINED3D_SM4_OP_SAMPLE                           = 0x45,
    WINED3D_SM4_OP_SAMPLE_C                         = 0x46,
    WINED3D_SM4_OP_SAMPLE_C_LZ                      = 0x47,
    WINED3D_SM4_OP_SAMPLE_LOD                       = 0x48,
    WINED3D_SM4_OP_SAMPLE_GRAD                      = 0x49,
    WINED3D_SM4_OP_SAMPLE_B                         = 0x4a,
    WINED3D_SM4_OP_SQRT                             = 0x4b,
    WINED3D_SM4_OP_SWITCH                           = 0x4c,
    WINED3D_SM4_OP_SINCOS                           = 0x4d,
    WINED3D_SM4_OP_UDIV                             = 0x4e,
    WINED3D_SM4_OP_ULT                              = 0x4f,
    WINED3D_SM4_OP_UGE                              = 0x50,
    WINED3D_SM4_OP_UMUL                             = 0x51,
    WINED3D_SM4_OP_UMAX                             = 0x53,
    WINED3D_SM4_OP_UMIN                             = 0x54,
    WINED3D_SM4_OP_USHR                             = 0x55,
    WINED3D_SM4_OP_UTOF                             = 0x56,
    WINED3D_SM4_OP_XOR                              = 0x57,
    WINED3D_SM4_OP_DCL_RESOURCE                     = 0x58,
    WINED3D_SM4_OP_DCL_CONSTANT_BUFFER              = 0x59,
    WINED3D_SM4_OP_DCL_SAMPLER                      = 0x5a,
    WINED3D_SM4_OP_DCL_INDEX_RANGE                  = 0x5b,
    WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY              = 0x5c,
    WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE              = 0x5d,
    WINED3D_SM4_OP_DCL_VERTICES_OUT                 = 0x5e,
    WINED3D_SM4_OP_DCL_INPUT                        = 0x5f,
    WINED3D_SM4_OP_DCL_INPUT_SGV                    = 0x60,
    WINED3D_SM4_OP_DCL_INPUT_SIV                    = 0x61,
    WINED3D_SM4_OP_DCL_INPUT_PS                     = 0x62,
    WINED3D_SM4_OP_DCL_INPUT_PS_SGV                 = 0x63,
    WINED3D_SM4_OP_DCL_INPUT_PS_SIV                 = 0x64,
    WINED3D_SM4_OP_DCL_OUTPUT                       = 0x65,
    WINED3D_SM4_OP_DCL_OUTPUT_SIV                   = 0x67,
    WINED3D_SM4_OP_DCL_TEMPS                        = 0x68,
    WINED3D_SM4_OP_DCL_INDEXABLE_TEMP               = 0x69,
    WINED3D_SM4_OP_DCL_GLOBAL_FLAGS                 = 0x6a,
    WINED3D_SM4_OP_LOD                              = 0x6c,
    WINED3D_SM4_OP_GATHER4                          = 0x6d,
    WINED3D_SM4_OP_SAMPLE_POS                       = 0x6e,
    WINED3D_SM4_OP_SAMPLE_INFO                      = 0x6f,
    WINED3D_SM5_OP_HS_DECLS                         = 0x71,
    WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE           = 0x72,
    WINED3D_SM5_OP_HS_FORK_PHASE                    = 0x73,
    WINED3D_SM5_OP_HS_JOIN_PHASE                    = 0x74,
    WINED3D_SM5_OP_EMIT_STREAM                      = 0x75,
    WINED3D_SM5_OP_CUT_STREAM                       = 0x76,
    WINED3D_SM5_OP_FCALL                            = 0x78,
    WINED3D_SM5_OP_BUFINFO                          = 0x79,
    WINED3D_SM5_OP_DERIV_RTX_COARSE                 = 0x7a,
    WINED3D_SM5_OP_DERIV_RTX_FINE                   = 0x7b,
    WINED3D_SM5_OP_DERIV_RTY_COARSE                 = 0x7c,
    WINED3D_SM5_OP_DERIV_RTY_FINE                   = 0x7d,
    WINED3D_SM5_OP_GATHER4_C                        = 0x7e,
    WINED3D_SM5_OP_GATHER4_PO                       = 0x7f,
    WINED3D_SM5_OP_GATHER4_PO_C                     = 0x80,
    WINED3D_SM5_OP_RCP                              = 0x81,
    WINED3D_SM5_OP_F32TOF16                         = 0x82,
    WINED3D_SM5_OP_F16TOF32                         = 0x83,
    WINED3D_SM5_OP_COUNTBITS                        = 0x86,
    WINED3D_SM5_OP_FIRSTBIT_HI                      = 0x87,
    WINED3D_SM5_OP_FIRSTBIT_LO                      = 0x88,
    WINED3D_SM5_OP_FIRSTBIT_SHI                     = 0x89,
    WINED3D_SM5_OP_UBFE                             = 0x8a,
    WINED3D_SM5_OP_IBFE                             = 0x8b,
    WINED3D_SM5_OP_BFI                              = 0x8c,
    WINED3D_SM5_OP_BFREV                            = 0x8d,
    WINED3D_SM5_OP_SWAPC                            = 0x8e,
    WINED3D_SM5_OP_DCL_STREAM                       = 0x8f,
    WINED3D_SM5_OP_DCL_FUNCTION_BODY                = 0x90,
    WINED3D_SM5_OP_DCL_FUNCTION_TABLE               = 0x91,
    WINED3D_SM5_OP_DCL_INTERFACE                    = 0x92,
    WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT    = 0x93,
    WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT   = 0x94,
    WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN           = 0x95,
    WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING     = 0x96,
    WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE = 0x97,
    WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR            = 0x98,
    WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT = 0x99,
    WINED3D_SM5_OP_DCL_HS_JOIN_PHASE_INSTANCE_COUNT = 0x9a,
    WINED3D_SM5_OP_DCL_THREAD_GROUP                 = 0x9b,
    WINED3D_SM5_OP_DCL_UAV_TYPED                    = 0x9c,
    WINED3D_SM5_OP_DCL_UAV_RAW                      = 0x9d,
    WINED3D_SM5_OP_DCL_UAV_STRUCTURED               = 0x9e,
    WINED3D_SM5_OP_DCL_TGSM_RAW                     = 0x9f,
    WINED3D_SM5_OP_DCL_TGSM_STRUCTURED              = 0xa0,
    WINED3D_SM5_OP_DCL_RESOURCE_RAW                 = 0xa1,
    WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED          = 0xa2,
    WINED3D_SM5_OP_LD_UAV_TYPED                     = 0xa3,
    WINED3D_SM5_OP_STORE_UAV_TYPED                  = 0xa4,
    WINED3D_SM5_OP_LD_RAW                           = 0xa5,
    WINED3D_SM5_OP_STORE_RAW                        = 0xa6,
    WINED3D_SM5_OP_LD_STRUCTURED                    = 0xa7,
    WINED3D_SM5_OP_STORE_STRUCTURED                 = 0xa8,
    WINED3D_SM5_OP_ATOMIC_AND                       = 0xa9,
    WINED3D_SM5_OP_ATOMIC_OR                        = 0xaa,
    WINED3D_SM5_OP_ATOMIC_XOR                       = 0xab,
    WINED3D_SM5_OP_ATOMIC_CMP_STORE                 = 0xac,
    WINED3D_SM5_OP_ATOMIC_IADD                      = 0xad,
    WINED3D_SM5_OP_ATOMIC_IMAX                      = 0xae,
    WINED3D_SM5_OP_ATOMIC_IMIN                      = 0xaf,
    WINED3D_SM5_OP_ATOMIC_UMAX                      = 0xb0,
    WINED3D_SM5_OP_ATOMIC_UMIN                      = 0xb1,
    WINED3D_SM5_OP_IMM_ATOMIC_ALLOC                 = 0xb2,
    WINED3D_SM5_OP_IMM_ATOMIC_CONSUME               = 0xb3,
    WINED3D_SM5_OP_IMM_ATOMIC_IADD                  = 0xb4,
    WINED3D_SM5_OP_IMM_ATOMIC_AND                   = 0xb5,
    WINED3D_SM5_OP_IMM_ATOMIC_OR                    = 0xb6,
    WINED3D_SM5_OP_IMM_ATOMIC_XOR                   = 0xb7,
    WINED3D_SM5_OP_IMM_ATOMIC_EXCH                  = 0xb8,
    WINED3D_SM5_OP_IMM_ATOMIC_CMP_EXCH              = 0xb9,
    WINED3D_SM5_OP_IMM_ATOMIC_IMAX                  = 0xba,
    WINED3D_SM5_OP_IMM_ATOMIC_IMIN                  = 0xbb,
    WINED3D_SM5_OP_IMM_ATOMIC_UMAX                  = 0xbc,
    WINED3D_SM5_OP_IMM_ATOMIC_UMIN                  = 0xbd,
    WINED3D_SM5_OP_SYNC                             = 0xbe,
    WINED3D_SM5_OP_EVAL_SAMPLE_INDEX                = 0xcc,
    WINED3D_SM5_OP_DCL_GS_INSTANCES                 = 0xce,
};
/* Kinds of instruction modifier token. */
enum wined3d_sm4_instruction_modifier
{
    WINED3D_SM4_MODIFIER_AOFFIMMI       = 0x1,
    WINED3D_SM5_MODIFIER_RESOURCE_TYPE  = 0x2,
    WINED3D_SM5_MODIFIER_DATA_TYPE      = 0x3,
};
/* Numeric SM4 / SM5 register type values. Gaps in the numbering are values
 * this enumeration does not name. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP                    = 0x00,
    WINED3D_SM4_RT_INPUT                   = 0x01,
    WINED3D_SM4_RT_OUTPUT                  = 0x02,
    WINED3D_SM4_RT_INDEXABLE_TEMP          = 0x03,
    WINED3D_SM4_RT_IMMCONST                = 0x04,
    WINED3D_SM4_RT_SAMPLER                 = 0x06,
    WINED3D_SM4_RT_RESOURCE                = 0x07,
    WINED3D_SM4_RT_CONSTBUFFER             = 0x08,
    WINED3D_SM4_RT_IMMCONSTBUFFER          = 0x09,
    WINED3D_SM4_RT_PRIMID                  = 0x0b,
    WINED3D_SM4_RT_DEPTHOUT                = 0x0c,
    WINED3D_SM4_RT_NULL                    = 0x0d,
    WINED3D_SM4_RT_RASTERIZER              = 0x0e,
    WINED3D_SM4_RT_OMASK                   = 0x0f,
    WINED3D_SM5_RT_STREAM                  = 0x10,
    WINED3D_SM5_RT_FUNCTION_BODY           = 0x11,
    WINED3D_SM5_RT_FUNCTION_POINTER        = 0x13,
    WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID = 0x16,
    WINED3D_SM5_RT_FORK_INSTANCE_ID        = 0x17,
    WINED3D_SM5_RT_JOIN_INSTANCE_ID        = 0x18,
    WINED3D_SM5_RT_INPUT_CONTROL_POINT     = 0x19,
    WINED3D_SM5_RT_OUTPUT_CONTROL_POINT    = 0x1a,
    WINED3D_SM5_RT_PATCH_CONSTANT_DATA     = 0x1b,
    WINED3D_SM5_RT_DOMAIN_LOCATION         = 0x1c,
    WINED3D_SM5_RT_UAV                     = 0x1e,
    WINED3D_SM5_RT_SHARED_MEMORY           = 0x1f,
    WINED3D_SM5_RT_THREAD_ID               = 0x20,
    WINED3D_SM5_RT_THREAD_GROUP_ID         = 0x21,
    WINED3D_SM5_RT_LOCAL_THREAD_ID         = 0x22,
    WINED3D_SM5_RT_COVERAGE                = 0x23,
    WINED3D_SM5_RT_LOCAL_THREAD_INDEX      = 0x24,
    WINED3D_SM5_RT_GS_INSTANCE_ID          = 0x25,
    WINED3D_SM5_RT_DEPTHOUT_GREATER_EQUAL  = 0x26,
    WINED3D_SM5_RT_DEPTHOUT_LESS_EQUAL     = 0x27,
};
/* Output primitive type values; used as indices into
 * output_primitive_type_table. */
enum wined3d_sm4_output_primitive_type
{
    WINED3D_SM4_OUTPUT_PT_POINTLIST     = 0x1,
    WINED3D_SM4_OUTPUT_PT_LINESTRIP     = 0x3,
    WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
};
/* Input primitive type values. The PATCHn values are consecutive, so the
 * control point count of a patch is (value - WINED3D_SM5_INPUT_PT_PATCH1 + 1). */
enum wined3d_sm4_input_primitive_type
{
    WINED3D_SM4_INPUT_PT_POINT       = 0x01,
    WINED3D_SM4_INPUT_PT_LINE        = 0x02,
    WINED3D_SM4_INPUT_PT_TRIANGLE    = 0x03,
    WINED3D_SM4_INPUT_PT_LINEADJ     = 0x06,
    WINED3D_SM4_INPUT_PT_TRIANGLEADJ = 0x07,
    WINED3D_SM5_INPUT_PT_PATCH1      = 0x08,
    WINED3D_SM5_INPUT_PT_PATCH2      = 0x09,
    WINED3D_SM5_INPUT_PT_PATCH3      = 0x0a,
    WINED3D_SM5_INPUT_PT_PATCH4      = 0x0b,
    WINED3D_SM5_INPUT_PT_PATCH5      = 0x0c,
    WINED3D_SM5_INPUT_PT_PATCH6      = 0x0d,
    WINED3D_SM5_INPUT_PT_PATCH7      = 0x0e,
    WINED3D_SM5_INPUT_PT_PATCH8      = 0x0f,
    WINED3D_SM5_INPUT_PT_PATCH9      = 0x10,
    WINED3D_SM5_INPUT_PT_PATCH10     = 0x11,
    WINED3D_SM5_INPUT_PT_PATCH11     = 0x12,
    WINED3D_SM5_INPUT_PT_PATCH12     = 0x13,
    WINED3D_SM5_INPUT_PT_PATCH13     = 0x14,
    WINED3D_SM5_INPUT_PT_PATCH14     = 0x15,
    WINED3D_SM5_INPUT_PT_PATCH15     = 0x16,
    WINED3D_SM5_INPUT_PT_PATCH16     = 0x17,
    WINED3D_SM5_INPUT_PT_PATCH17     = 0x18,
    WINED3D_SM5_INPUT_PT_PATCH18     = 0x19,
    WINED3D_SM5_INPUT_PT_PATCH19     = 0x1a,
    WINED3D_SM5_INPUT_PT_PATCH20     = 0x1b,
    WINED3D_SM5_INPUT_PT_PATCH21     = 0x1c,
    WINED3D_SM5_INPUT_PT_PATCH22     = 0x1d,
    WINED3D_SM5_INPUT_PT_PATCH23     = 0x1e,
    WINED3D_SM5_INPUT_PT_PATCH24     = 0x1f,
    WINED3D_SM5_INPUT_PT_PATCH25     = 0x20,
    WINED3D_SM5_INPUT_PT_PATCH26     = 0x21,
    WINED3D_SM5_INPUT_PT_PATCH27     = 0x22,
    WINED3D_SM5_INPUT_PT_PATCH28     = 0x23,
    WINED3D_SM5_INPUT_PT_PATCH29     = 0x24,
    WINED3D_SM5_INPUT_PT_PATCH30     = 0x25,
    WINED3D_SM5_INPUT_PT_PATCH31     = 0x26,
    WINED3D_SM5_INPUT_PT_PATCH32     = 0x27,
};
/* Swizzle type values. */
enum wined3d_sm4_swizzle_type
{
    WINED3D_SM4_SWIZZLE_NONE   = 0x0,
    WINED3D_SM4_SWIZZLE_VEC4   = 0x1,
    WINED3D_SM4_SWIZZLE_SCALAR = 0x2,
};
/* Dimension values. */
enum wined3d_sm4_dimension
{
    WINED3D_SM4_DIMENSION_SCALAR = 0x1,
    WINED3D_SM4_DIMENSION_VEC4   = 0x2,
};
/* Resource type values; used as indices into resource_type_table. */
enum wined3d_sm4_resource_type
{
    WINED3D_SM4_RESOURCE_BUFFER            = 0x1,
    WINED3D_SM4_RESOURCE_TEXTURE_1D        = 0x2,
    WINED3D_SM4_RESOURCE_TEXTURE_2D        = 0x3,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMS      = 0x4,
    WINED3D_SM4_RESOURCE_TEXTURE_3D        = 0x5,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBE      = 0x6,
    WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY   = 0x7,
    WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY   = 0x8,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY = 0x9,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBEARRAY = 0xa,
};
/* Resource data type values; used as indices into data_type_table. */
enum wined3d_sm4_data_type
{
    WINED3D_SM4_DATA_UNORM = 0x1,
    WINED3D_SM4_DATA_SNORM = 0x2,
    WINED3D_SM4_DATA_INT   = 0x3,
    WINED3D_SM4_DATA_UINT  = 0x4,
    WINED3D_SM4_DATA_FLOAT = 0x5,
};
/* Sampler mode values. */
enum wined3d_sm4_sampler_mode
{
    WINED3D_SM4_SAMPLER_DEFAULT    = 0x0,
    WINED3D_SM4_SAMPLER_COMPARISON = 0x1,
};
/* Shader data block type values. */
enum wined3d_sm4_shader_data_type
{
    WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER = 0x3,
    WINED3D_SM4_SHADER_DATA_MESSAGE                   = 0x4,
};
454 struct wined3d_shader_src_param_entry
457 struct wined3d_shader_src_param param
;
460 struct wined3d_sm4_data
462 struct wined3d_shader_version shader_version
;
463 const DWORD
*start
, *end
;
465 unsigned int output_map
[MAX_REG_OUTPUT
];
467 struct wined3d_shader_src_param src_param
[5];
468 struct wined3d_shader_dst_param dst_param
[2];
469 struct list src_free
;
471 struct wined3d_shader_immediate_constant_buffer icb
;
474 struct wined3d_sm4_opcode_info
476 enum wined3d_sm4_opcode opcode
;
477 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx
;
478 const char *dst_info
;
479 const char *src_info
;
480 void (*read_opcode_func
)(struct wined3d_shader_instruction
*ins
,
481 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
482 struct wined3d_sm4_data
*priv
);
485 static const enum wined3d_primitive_type output_primitive_type_table
[] =
487 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
488 /* WINED3D_SM4_OUTPUT_PT_POINTLIST */ WINED3D_PT_POINTLIST
,
489 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
490 /* WINED3D_SM4_OUTPUT_PT_LINESTRIP */ WINED3D_PT_LINESTRIP
,
491 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
492 /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ WINED3D_PT_TRIANGLESTRIP
,
495 static const enum wined3d_primitive_type input_primitive_type_table
[] =
497 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
498 /* WINED3D_SM4_INPUT_PT_POINT */ WINED3D_PT_POINTLIST
,
499 /* WINED3D_SM4_INPUT_PT_LINE */ WINED3D_PT_LINELIST
,
500 /* WINED3D_SM4_INPUT_PT_TRIANGLE */ WINED3D_PT_TRIANGLELIST
,
501 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
502 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
503 /* WINED3D_SM4_INPUT_PT_LINEADJ */ WINED3D_PT_LINELIST_ADJ
,
504 /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */ WINED3D_PT_TRIANGLELIST_ADJ
,
507 static const enum wined3d_shader_resource_type resource_type_table
[] =
509 /* 0 */ WINED3D_SHADER_RESOURCE_NONE
,
510 /* WINED3D_SM4_RESOURCE_BUFFER */ WINED3D_SHADER_RESOURCE_BUFFER
,
511 /* WINED3D_SM4_RESOURCE_TEXTURE_1D */ WINED3D_SHADER_RESOURCE_TEXTURE_1D
,
512 /* WINED3D_SM4_RESOURCE_TEXTURE_2D */ WINED3D_SHADER_RESOURCE_TEXTURE_2D
,
513 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMS */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMS
,
514 /* WINED3D_SM4_RESOURCE_TEXTURE_3D */ WINED3D_SHADER_RESOURCE_TEXTURE_3D
,
515 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBE */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBE
,
516 /* WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_1DARRAY
,
517 /* WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DARRAY
,
518 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY
,
519 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBEARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBEARRAY
,
522 static const enum wined3d_data_type data_type_table
[] =
524 /* 0 */ WINED3D_DATA_FLOAT
,
525 /* WINED3D_SM4_DATA_UNORM */ WINED3D_DATA_UNORM
,
526 /* WINED3D_SM4_DATA_SNORM */ WINED3D_DATA_SNORM
,
527 /* WINED3D_SM4_DATA_INT */ WINED3D_DATA_INT
,
528 /* WINED3D_SM4_DATA_UINT */ WINED3D_DATA_UINT
,
529 /* WINED3D_SM4_DATA_FLOAT */ WINED3D_DATA_FLOAT
,
532 static BOOL
shader_sm4_read_src_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
, const DWORD
*end
,
533 enum wined3d_data_type data_type
, struct wined3d_shader_src_param
*src_param
);
534 static BOOL
shader_sm4_read_dst_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
, const DWORD
*end
,
535 enum wined3d_data_type data_type
, struct wined3d_shader_dst_param
*dst_param
);
537 static void shader_sm4_read_conditional_op(struct wined3d_shader_instruction
*ins
,
538 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
539 struct wined3d_sm4_data
*priv
)
541 shader_sm4_read_src_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_UINT
, &priv
->src_param
[0]);
542 ins
->flags
= (opcode_token
& WINED3D_SM4_CONDITIONAL_NZ
) ?
543 WINED3D_SHADER_CONDITIONAL_OP_NZ
: WINED3D_SHADER_CONDITIONAL_OP_Z
;
546 static void shader_sm4_read_shader_data(struct wined3d_shader_instruction
*ins
,
547 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
548 struct wined3d_sm4_data
*priv
)
550 enum wined3d_sm4_shader_data_type type
;
551 unsigned int icb_size
;
553 type
= (opcode_token
& WINED3D_SM4_SHADER_DATA_TYPE_MASK
) >> WINED3D_SM4_SHADER_DATA_TYPE_SHIFT
;
554 if (type
!= WINED3D_SM4_SHADER_DATA_IMMEDIATE_CONSTANT_BUFFER
)
556 FIXME("Ignoring shader data type %#x.\n", type
);
557 ins
->handler_idx
= WINED3DSIH_NOP
;
562 icb_size
= token_count
- 1;
563 if (icb_size
% 4 || icb_size
> MAX_IMMEDIATE_CONSTANT_BUFFER_SIZE
)
565 FIXME("Unexpected immediate constant buffer size %u.\n", icb_size
);
566 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
570 priv
->icb
.vec4_count
= icb_size
/ 4;
571 memcpy(priv
->icb
.data
, tokens
, sizeof(*tokens
) * icb_size
);
572 ins
->declaration
.icb
= &priv
->icb
;
575 static void shader_sm4_read_dcl_resource(struct wined3d_shader_instruction
*ins
,
576 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
577 struct wined3d_sm4_data
*priv
)
579 enum wined3d_sm4_resource_type resource_type
;
580 enum wined3d_sm4_data_type data_type
;
581 enum wined3d_data_type reg_data_type
;
584 resource_type
= (opcode_token
& WINED3D_SM4_RESOURCE_TYPE_MASK
) >> WINED3D_SM4_RESOURCE_TYPE_SHIFT
;
585 if (!resource_type
|| (resource_type
>= ARRAY_SIZE(resource_type_table
)))
587 FIXME("Unhandled resource type %#x.\n", resource_type
);
588 ins
->declaration
.semantic
.resource_type
= WINED3D_SHADER_RESOURCE_NONE
;
592 ins
->declaration
.semantic
.resource_type
= resource_type_table
[resource_type
];
594 reg_data_type
= opcode
== WINED3D_SM4_OP_DCL_RESOURCE
? WINED3D_DATA_RESOURCE
: WINED3D_DATA_UAV
;
595 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], reg_data_type
, &ins
->declaration
.semantic
.reg
);
597 components
= *tokens
++;
598 if ((components
& 0xfff0) != (components
& 0xf) * 0x1110)
599 FIXME("Components (%#x) have different data types.\n", components
);
600 data_type
= components
& 0xf;
602 if (!data_type
|| (data_type
>= ARRAY_SIZE(data_type_table
)))
604 FIXME("Unhandled data type %#x.\n", data_type
);
605 ins
->declaration
.semantic
.resource_data_type
= WINED3D_DATA_FLOAT
;
609 ins
->declaration
.semantic
.resource_data_type
= data_type_table
[data_type
];
612 if (reg_data_type
== WINED3D_DATA_UAV
)
613 ins
->flags
= (opcode_token
& WINED3D_SM5_UAV_FLAGS_MASK
) >> WINED3D_SM5_UAV_FLAGS_SHIFT
;
616 static void shader_sm4_read_dcl_constant_buffer(struct wined3d_shader_instruction
*ins
,
617 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
618 struct wined3d_sm4_data
*priv
)
620 shader_sm4_read_src_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
, &ins
->declaration
.src
);
621 if (opcode_token
& WINED3D_SM4_INDEX_TYPE_MASK
)
622 ins
->flags
|= WINED3DSI_INDEXED_DYNAMIC
;
625 static void shader_sm4_read_dcl_sampler(struct wined3d_shader_instruction
*ins
,
626 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
627 struct wined3d_sm4_data
*priv
)
629 ins
->flags
= (opcode_token
& WINED3D_SM4_SAMPLER_MODE_MASK
) >> WINED3D_SM4_SAMPLER_MODE_SHIFT
;
630 if (ins
->flags
& ~WINED3D_SM4_SAMPLER_COMPARISON
)
631 FIXME("Unhandled sampler mode %#x.\n", ins
->flags
);
632 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_SAMPLER
, &ins
->declaration
.dst
);
635 static void shader_sm4_read_dcl_index_range(struct wined3d_shader_instruction
*ins
,
636 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
637 struct wined3d_sm4_data
*priv
)
639 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_OPAQUE
,
640 &ins
->declaration
.index_range
.first_register
);
641 ins
->declaration
.index_range
.last_register
= *tokens
;
644 static void shader_sm4_read_dcl_output_topology(struct wined3d_shader_instruction
*ins
,
645 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
646 struct wined3d_sm4_data
*priv
)
648 enum wined3d_sm4_output_primitive_type primitive_type
;
650 primitive_type
= (opcode_token
& WINED3D_SM4_PRIMITIVE_TYPE_MASK
) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT
;
651 if (primitive_type
>= ARRAY_SIZE(output_primitive_type_table
))
652 ins
->declaration
.primitive_type
.type
= WINED3D_PT_UNDEFINED
;
654 ins
->declaration
.primitive_type
.type
= output_primitive_type_table
[primitive_type
];
656 if (ins
->declaration
.primitive_type
.type
== WINED3D_PT_UNDEFINED
)
657 FIXME("Unhandled output primitive type %#x.\n", primitive_type
);
660 static void shader_sm4_read_dcl_input_primitive(struct wined3d_shader_instruction
*ins
,
661 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
662 struct wined3d_sm4_data
*priv
)
664 enum wined3d_sm4_input_primitive_type primitive_type
;
666 primitive_type
= (opcode_token
& WINED3D_SM4_PRIMITIVE_TYPE_MASK
) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT
;
667 if (WINED3D_SM5_INPUT_PT_PATCH1
<= primitive_type
&& primitive_type
<= WINED3D_SM5_INPUT_PT_PATCH32
)
669 ins
->declaration
.primitive_type
.type
= WINED3D_PT_PATCH
;
670 ins
->declaration
.primitive_type
.patch_vertex_count
= primitive_type
- WINED3D_SM5_INPUT_PT_PATCH1
+ 1;
672 else if (primitive_type
>= ARRAY_SIZE(input_primitive_type_table
))
674 ins
->declaration
.primitive_type
.type
= WINED3D_PT_UNDEFINED
;
678 ins
->declaration
.primitive_type
.type
= input_primitive_type_table
[primitive_type
];
681 if (ins
->declaration
.primitive_type
.type
== WINED3D_PT_UNDEFINED
)
682 FIXME("Unhandled input primitive type %#x.\n", primitive_type
);
685 static void shader_sm4_read_declaration_count(struct wined3d_shader_instruction
*ins
,
686 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
687 struct wined3d_sm4_data
*priv
)
689 ins
->declaration
.count
= *tokens
;
692 static void shader_sm4_read_declaration_dst(struct wined3d_shader_instruction
*ins
,
693 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
694 struct wined3d_sm4_data
*priv
)
696 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
, &ins
->declaration
.dst
);
699 static void shader_sm4_read_declaration_register_semantic(struct wined3d_shader_instruction
*ins
,
700 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
701 struct wined3d_sm4_data
*priv
)
703 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
,
704 &ins
->declaration
.register_semantic
.reg
);
705 ins
->declaration
.register_semantic
.sysval_semantic
= *tokens
;
708 static void shader_sm4_read_dcl_input_ps(struct wined3d_shader_instruction
*ins
,
709 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
710 struct wined3d_sm4_data
*priv
)
712 ins
->flags
= (opcode_token
& WINED3D_SM4_INTERPOLATION_MODE_MASK
) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT
;
713 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
, &ins
->declaration
.dst
);
716 static void shader_sm4_read_dcl_input_ps_siv(struct wined3d_shader_instruction
*ins
,
717 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
718 struct wined3d_sm4_data
*priv
)
720 ins
->flags
= (opcode_token
& WINED3D_SM4_INTERPOLATION_MODE_MASK
) >> WINED3D_SM4_INTERPOLATION_MODE_SHIFT
;
721 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
,
722 &ins
->declaration
.register_semantic
.reg
);
723 ins
->declaration
.register_semantic
.sysval_semantic
= *tokens
;
726 static void shader_sm4_read_dcl_indexable_temp(struct wined3d_shader_instruction
*ins
,
727 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
728 struct wined3d_sm4_data
*priv
)
730 ins
->declaration
.indexable_temp
.register_idx
= *tokens
++;
731 ins
->declaration
.indexable_temp
.register_size
= *tokens
++;
732 ins
->declaration
.indexable_temp
.component_count
= *tokens
;
735 static void shader_sm4_read_dcl_global_flags(struct wined3d_shader_instruction
*ins
,
736 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
737 struct wined3d_sm4_data
*priv
)
739 ins
->flags
= (opcode_token
& WINED3D_SM4_GLOBAL_FLAGS_MASK
) >> WINED3D_SM4_GLOBAL_FLAGS_SHIFT
;
742 static void shader_sm5_read_fcall(struct wined3d_shader_instruction
*ins
,
743 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
744 struct wined3d_sm4_data
*priv
)
746 priv
->src_param
[0].reg
.u
.fp_body_idx
= *tokens
++;
747 shader_sm4_read_src_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_OPAQUE
, &priv
->src_param
[0]);
750 static void shader_sm5_read_dcl_function_body(struct wined3d_shader_instruction
*ins
,
751 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
752 struct wined3d_sm4_data
*priv
)
754 ins
->declaration
.index
= *tokens
;
757 static void shader_sm5_read_dcl_function_table(struct wined3d_shader_instruction
*ins
,
758 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
759 struct wined3d_sm4_data
*priv
)
761 ins
->declaration
.index
= *tokens
++;
762 FIXME("Ignoring set of function bodies (count %u).\n", *tokens
);
765 static void shader_sm5_read_dcl_interface(struct wined3d_shader_instruction
*ins
,
766 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
767 struct wined3d_sm4_data
*priv
)
769 ins
->declaration
.fp
.index
= *tokens
++;
770 ins
->declaration
.fp
.body_count
= *tokens
++;
771 ins
->declaration
.fp
.array_size
= *tokens
>> WINED3D_SM5_FP_ARRAY_SIZE_SHIFT
;
772 ins
->declaration
.fp
.table_count
= *tokens
++ & WINED3D_SM5_FP_TABLE_COUNT_MASK
;
773 FIXME("Ignoring set of function tables (count %u).\n", ins
->declaration
.fp
.table_count
);
776 static void shader_sm5_read_control_point_count(struct wined3d_shader_instruction
*ins
,
777 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
778 struct wined3d_sm4_data
*priv
)
780 ins
->declaration
.count
= (opcode_token
& WINED3D_SM5_CONTROL_POINT_COUNT_MASK
)
781 >> WINED3D_SM5_CONTROL_POINT_COUNT_SHIFT
;
784 static void shader_sm5_read_dcl_tessellator_domain(struct wined3d_shader_instruction
*ins
,
785 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
786 struct wined3d_sm4_data
*priv
)
788 ins
->declaration
.tessellator_domain
= (opcode_token
& WINED3D_SM5_TESSELLATOR_MASK
)
789 >> WINED3D_SM5_TESSELLATOR_SHIFT
;
792 static void shader_sm5_read_dcl_tessellator_partitioning(struct wined3d_shader_instruction
*ins
,
793 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
794 struct wined3d_sm4_data
*priv
)
796 ins
->declaration
.tessellator_partitioning
= (opcode_token
& WINED3D_SM5_TESSELLATOR_MASK
)
797 >> WINED3D_SM5_TESSELLATOR_SHIFT
;
800 static void shader_sm5_read_dcl_tessellator_output_primitive(struct wined3d_shader_instruction
*ins
,
801 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
802 struct wined3d_sm4_data
*priv
)
804 ins
->declaration
.tessellator_output_primitive
= (opcode_token
& WINED3D_SM5_TESSELLATOR_MASK
)
805 >> WINED3D_SM5_TESSELLATOR_SHIFT
;
808 static void shader_sm5_read_dcl_hs_max_tessfactor(struct wined3d_shader_instruction
*ins
,
809 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
810 struct wined3d_sm4_data
*priv
)
812 ins
->declaration
.max_tessellation_factor
= *(float *)tokens
;
815 static void shader_sm5_read_dcl_thread_group(struct wined3d_shader_instruction
*ins
,
816 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
817 struct wined3d_sm4_data
*priv
)
819 ins
->declaration
.thread_group_size
.x
= *tokens
++;
820 ins
->declaration
.thread_group_size
.y
= *tokens
++;
821 ins
->declaration
.thread_group_size
.z
= *tokens
++;
824 static void shader_sm5_read_dcl_uav_raw(struct wined3d_shader_instruction
*ins
,
825 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
826 struct wined3d_sm4_data
*priv
)
828 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_UAV
, &ins
->declaration
.dst
);
829 ins
->flags
= (opcode_token
& WINED3D_SM5_UAV_FLAGS_MASK
) >> WINED3D_SM5_UAV_FLAGS_SHIFT
;
832 static void shader_sm5_read_dcl_uav_structured(struct wined3d_shader_instruction
*ins
,
833 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
834 struct wined3d_sm4_data
*priv
)
836 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_UAV
,
837 &ins
->declaration
.structured_resource
.reg
);
838 ins
->flags
= (opcode_token
& WINED3D_SM5_UAV_FLAGS_MASK
) >> WINED3D_SM5_UAV_FLAGS_SHIFT
;
839 ins
->declaration
.structured_resource
.byte_stride
= *tokens
;
840 if (ins
->declaration
.structured_resource
.byte_stride
% 4)
841 FIXME("Byte stride %u is not multiple of 4.\n", ins
->declaration
.structured_resource
.byte_stride
);
844 static void shader_sm5_read_dcl_tgsm_raw(struct wined3d_shader_instruction
*ins
,
845 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
846 struct wined3d_sm4_data
*priv
)
848 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
, &ins
->declaration
.tgsm_raw
.reg
);
849 ins
->declaration
.tgsm_raw
.byte_count
= *tokens
;
850 if (ins
->declaration
.tgsm_raw
.byte_count
% 4)
851 FIXME("Byte count %u is not multiple of 4.\n", ins
->declaration
.tgsm_raw
.byte_count
);
854 static void shader_sm5_read_dcl_tgsm_structured(struct wined3d_shader_instruction
*ins
,
855 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
856 struct wined3d_sm4_data
*priv
)
858 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_FLOAT
,
859 &ins
->declaration
.tgsm_structured
.reg
);
860 ins
->declaration
.tgsm_structured
.byte_stride
= *tokens
++;
861 ins
->declaration
.tgsm_structured
.structure_count
= *tokens
;
862 if (ins
->declaration
.tgsm_structured
.byte_stride
% 4)
863 FIXME("Byte stride %u is not multiple of 4.\n", ins
->declaration
.tgsm_structured
.byte_stride
);
866 static void shader_sm5_read_dcl_resource_structured(struct wined3d_shader_instruction
*ins
,
867 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
868 struct wined3d_sm4_data
*priv
)
870 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_RESOURCE
,
871 &ins
->declaration
.structured_resource
.reg
);
872 ins
->declaration
.structured_resource
.byte_stride
= *tokens
;
873 if (ins
->declaration
.structured_resource
.byte_stride
% 4)
874 FIXME("Byte stride %u is not multiple of 4.\n", ins
->declaration
.structured_resource
.byte_stride
);
877 static void shader_sm5_read_dcl_resource_raw(struct wined3d_shader_instruction
*ins
,
878 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
879 struct wined3d_sm4_data
*priv
)
881 shader_sm4_read_dst_param(priv
, &tokens
, &tokens
[token_count
], WINED3D_DATA_RESOURCE
, &ins
->declaration
.dst
);
884 static void shader_sm5_read_sync(struct wined3d_shader_instruction
*ins
,
885 DWORD opcode
, DWORD opcode_token
, const DWORD
*tokens
, unsigned int token_count
,
886 struct wined3d_sm4_data
*priv
)
888 ins
->flags
= (opcode_token
& WINED3D_SM5_SYNC_FLAGS_MASK
) >> WINED3D_SM5_SYNC_FLAGS_SHIFT
;
892 * f -> WINED3D_DATA_FLOAT
893 * i -> WINED3D_DATA_INT
894 * u -> WINED3D_DATA_UINT
895 * O -> WINED3D_DATA_OPAQUE
896 * R -> WINED3D_DATA_RESOURCE
897 * S -> WINED3D_DATA_SAMPLER
898 * U -> WINED3D_DATA_UAV
900 static const struct wined3d_sm4_opcode_info opcode_table
[] =
902 {WINED3D_SM4_OP_ADD
, WINED3DSIH_ADD
, "f", "ff"},
903 {WINED3D_SM4_OP_AND
, WINED3DSIH_AND
, "u", "uu"},
904 {WINED3D_SM4_OP_BREAK
, WINED3DSIH_BREAK
, "", ""},
905 {WINED3D_SM4_OP_BREAKC
, WINED3DSIH_BREAKP
, "", "u",
906 shader_sm4_read_conditional_op
},
907 {WINED3D_SM4_OP_CASE
, WINED3DSIH_CASE
, "", "u"},
908 {WINED3D_SM4_OP_CONTINUE
, WINED3DSIH_CONTINUE
, "", ""},
909 {WINED3D_SM4_OP_CONTINUEC
, WINED3DSIH_CONTINUEP
, "", "u",
910 shader_sm4_read_conditional_op
},
911 {WINED3D_SM4_OP_CUT
, WINED3DSIH_CUT
, "", ""},
912 {WINED3D_SM4_OP_DEFAULT
, WINED3DSIH_DEFAULT
, "", ""},
913 {WINED3D_SM4_OP_DERIV_RTX
, WINED3DSIH_DSX
, "f", "f"},
914 {WINED3D_SM4_OP_DERIV_RTY
, WINED3DSIH_DSY
, "f", "f"},
915 {WINED3D_SM4_OP_DISCARD
, WINED3DSIH_TEXKILL
, "", "u",
916 shader_sm4_read_conditional_op
},
917 {WINED3D_SM4_OP_DIV
, WINED3DSIH_DIV
, "f", "ff"},
918 {WINED3D_SM4_OP_DP2
, WINED3DSIH_DP2
, "f", "ff"},
919 {WINED3D_SM4_OP_DP3
, WINED3DSIH_DP3
, "f", "ff"},
920 {WINED3D_SM4_OP_DP4
, WINED3DSIH_DP4
, "f", "ff"},
921 {WINED3D_SM4_OP_ELSE
, WINED3DSIH_ELSE
, "", ""},
922 {WINED3D_SM4_OP_EMIT
, WINED3DSIH_EMIT
, "", ""},
923 {WINED3D_SM4_OP_ENDIF
, WINED3DSIH_ENDIF
, "", ""},
924 {WINED3D_SM4_OP_ENDLOOP
, WINED3DSIH_ENDLOOP
, "", ""},
925 {WINED3D_SM4_OP_ENDSWITCH
, WINED3DSIH_ENDSWITCH
, "", ""},
926 {WINED3D_SM4_OP_EQ
, WINED3DSIH_EQ
, "u", "ff"},
927 {WINED3D_SM4_OP_EXP
, WINED3DSIH_EXP
, "f", "f"},
928 {WINED3D_SM4_OP_FRC
, WINED3DSIH_FRC
, "f", "f"},
929 {WINED3D_SM4_OP_FTOI
, WINED3DSIH_FTOI
, "i", "f"},
930 {WINED3D_SM4_OP_FTOU
, WINED3DSIH_FTOU
, "u", "f"},
931 {WINED3D_SM4_OP_GE
, WINED3DSIH_GE
, "u", "ff"},
932 {WINED3D_SM4_OP_IADD
, WINED3DSIH_IADD
, "i", "ii"},
933 {WINED3D_SM4_OP_IF
, WINED3DSIH_IF
, "", "u",
934 shader_sm4_read_conditional_op
},
935 {WINED3D_SM4_OP_IEQ
, WINED3DSIH_IEQ
, "u", "ii"},
936 {WINED3D_SM4_OP_IGE
, WINED3DSIH_IGE
, "u", "ii"},
937 {WINED3D_SM4_OP_ILT
, WINED3DSIH_ILT
, "u", "ii"},
938 {WINED3D_SM4_OP_IMAD
, WINED3DSIH_IMAD
, "i", "iii"},
939 {WINED3D_SM4_OP_IMAX
, WINED3DSIH_IMAX
, "i", "ii"},
940 {WINED3D_SM4_OP_IMIN
, WINED3DSIH_IMIN
, "i", "ii"},
941 {WINED3D_SM4_OP_IMUL
, WINED3DSIH_IMUL
, "ii", "ii"},
942 {WINED3D_SM4_OP_INE
, WINED3DSIH_INE
, "u", "ii"},
943 {WINED3D_SM4_OP_INEG
, WINED3DSIH_INEG
, "i", "i"},
944 {WINED3D_SM4_OP_ISHL
, WINED3DSIH_ISHL
, "i", "ii"},
945 {WINED3D_SM4_OP_ISHR
, WINED3DSIH_ISHR
, "i", "ii"},
946 {WINED3D_SM4_OP_ITOF
, WINED3DSIH_ITOF
, "f", "i"},
947 {WINED3D_SM4_OP_LABEL
, WINED3DSIH_LABEL
, "", "O"},
948 {WINED3D_SM4_OP_LD
, WINED3DSIH_LD
, "u", "iR"},
949 {WINED3D_SM4_OP_LD2DMS
, WINED3DSIH_LD2DMS
, "u", "iRi"},
950 {WINED3D_SM4_OP_LOG
, WINED3DSIH_LOG
, "f", "f"},
951 {WINED3D_SM4_OP_LOOP
, WINED3DSIH_LOOP
, "", ""},
952 {WINED3D_SM4_OP_LT
, WINED3DSIH_LT
, "u", "ff"},
953 {WINED3D_SM4_OP_MAD
, WINED3DSIH_MAD
, "f", "fff"},
954 {WINED3D_SM4_OP_MIN
, WINED3DSIH_MIN
, "f", "ff"},
955 {WINED3D_SM4_OP_MAX
, WINED3DSIH_MAX
, "f", "ff"},
956 {WINED3D_SM4_OP_SHADER_DATA
, WINED3DSIH_DCL_IMMEDIATE_CONSTANT_BUFFER
, "", "",
957 shader_sm4_read_shader_data
},
958 {WINED3D_SM4_OP_MOV
, WINED3DSIH_MOV
, "f", "f"},
959 {WINED3D_SM4_OP_MOVC
, WINED3DSIH_MOVC
, "f", "uff"},
960 {WINED3D_SM4_OP_MUL
, WINED3DSIH_MUL
, "f", "ff"},
961 {WINED3D_SM4_OP_NE
, WINED3DSIH_NE
, "u", "ff"},
962 {WINED3D_SM4_OP_NOP
, WINED3DSIH_NOP
, "", ""},
963 {WINED3D_SM4_OP_NOT
, WINED3DSIH_NOT
, "u", "u"},
964 {WINED3D_SM4_OP_OR
, WINED3DSIH_OR
, "u", "uu"},
965 {WINED3D_SM4_OP_RESINFO
, WINED3DSIH_RESINFO
, "f", "iR"},
966 {WINED3D_SM4_OP_RET
, WINED3DSIH_RET
, "", ""},
967 {WINED3D_SM4_OP_RETC
, WINED3DSIH_RETP
, "", "u",
968 shader_sm4_read_conditional_op
},
969 {WINED3D_SM4_OP_ROUND_NE
, WINED3DSIH_ROUND_NE
, "f", "f"},
970 {WINED3D_SM4_OP_ROUND_NI
, WINED3DSIH_ROUND_NI
, "f", "f"},
971 {WINED3D_SM4_OP_ROUND_PI
, WINED3DSIH_ROUND_PI
, "f", "f"},
972 {WINED3D_SM4_OP_ROUND_Z
, WINED3DSIH_ROUND_Z
, "f", "f"},
973 {WINED3D_SM4_OP_RSQ
, WINED3DSIH_RSQ
, "f", "f"},
974 {WINED3D_SM4_OP_SAMPLE
, WINED3DSIH_SAMPLE
, "u", "fRS"},
975 {WINED3D_SM4_OP_SAMPLE_C
, WINED3DSIH_SAMPLE_C
, "f", "fRSf"},
976 {WINED3D_SM4_OP_SAMPLE_C_LZ
, WINED3DSIH_SAMPLE_C_LZ
, "f", "fRSf"},
977 {WINED3D_SM4_OP_SAMPLE_LOD
, WINED3DSIH_SAMPLE_LOD
, "u", "fRSf"},
978 {WINED3D_SM4_OP_SAMPLE_GRAD
, WINED3DSIH_SAMPLE_GRAD
, "u", "fRSff"},
979 {WINED3D_SM4_OP_SAMPLE_B
, WINED3DSIH_SAMPLE_B
, "u", "fRSf"},
980 {WINED3D_SM4_OP_SQRT
, WINED3DSIH_SQRT
, "f", "f"},
981 {WINED3D_SM4_OP_SWITCH
, WINED3DSIH_SWITCH
, "", "u"},
982 {WINED3D_SM4_OP_SINCOS
, WINED3DSIH_SINCOS
, "ff", "f"},
983 {WINED3D_SM4_OP_UDIV
, WINED3DSIH_UDIV
, "uu", "uu"},
984 {WINED3D_SM4_OP_ULT
, WINED3DSIH_ULT
, "u", "uu"},
985 {WINED3D_SM4_OP_UGE
, WINED3DSIH_UGE
, "u", "uu"},
986 {WINED3D_SM4_OP_UMUL
, WINED3DSIH_UMUL
, "uu", "uu"},
987 {WINED3D_SM4_OP_UMAX
, WINED3DSIH_UMAX
, "u", "uu"},
988 {WINED3D_SM4_OP_UMIN
, WINED3DSIH_UMIN
, "u", "uu"},
989 {WINED3D_SM4_OP_USHR
, WINED3DSIH_USHR
, "u", "uu"},
990 {WINED3D_SM4_OP_UTOF
, WINED3DSIH_UTOF
, "f", "u"},
991 {WINED3D_SM4_OP_XOR
, WINED3DSIH_XOR
, "u", "uu"},
992 {WINED3D_SM4_OP_DCL_RESOURCE
, WINED3DSIH_DCL
, "R", "",
993 shader_sm4_read_dcl_resource
},
994 {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER
, WINED3DSIH_DCL_CONSTANT_BUFFER
, "", "",
995 shader_sm4_read_dcl_constant_buffer
},
996 {WINED3D_SM4_OP_DCL_SAMPLER
, WINED3DSIH_DCL_SAMPLER
, "", "",
997 shader_sm4_read_dcl_sampler
},
998 {WINED3D_SM4_OP_DCL_INDEX_RANGE
, WINED3DSIH_DCL_INDEX_RANGE
, "", "",
999 shader_sm4_read_dcl_index_range
},
1000 {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY
, WINED3DSIH_DCL_OUTPUT_TOPOLOGY
, "", "",
1001 shader_sm4_read_dcl_output_topology
},
1002 {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE
, WINED3DSIH_DCL_INPUT_PRIMITIVE
, "", "",
1003 shader_sm4_read_dcl_input_primitive
},
1004 {WINED3D_SM4_OP_DCL_VERTICES_OUT
, WINED3DSIH_DCL_VERTICES_OUT
, "", "",
1005 shader_sm4_read_declaration_count
},
1006 {WINED3D_SM4_OP_DCL_INPUT
, WINED3DSIH_DCL_INPUT
, "", "",
1007 shader_sm4_read_declaration_dst
},
1008 {WINED3D_SM4_OP_DCL_INPUT_SGV
, WINED3DSIH_DCL_INPUT_SGV
, "", "",
1009 shader_sm4_read_declaration_register_semantic
},
1010 {WINED3D_SM4_OP_DCL_INPUT_SIV
, WINED3DSIH_DCL_INPUT_SIV
, "", "",
1011 shader_sm4_read_declaration_register_semantic
},
1012 {WINED3D_SM4_OP_DCL_INPUT_PS
, WINED3DSIH_DCL_INPUT_PS
, "", "",
1013 shader_sm4_read_dcl_input_ps
},
1014 {WINED3D_SM4_OP_DCL_INPUT_PS_SGV
, WINED3DSIH_DCL_INPUT_PS_SGV
, "", "",
1015 shader_sm4_read_declaration_register_semantic
},
1016 {WINED3D_SM4_OP_DCL_INPUT_PS_SIV
, WINED3DSIH_DCL_INPUT_PS_SIV
, "", "",
1017 shader_sm4_read_dcl_input_ps_siv
},
1018 {WINED3D_SM4_OP_DCL_OUTPUT
, WINED3DSIH_DCL_OUTPUT
, "", "",
1019 shader_sm4_read_declaration_dst
},
1020 {WINED3D_SM4_OP_DCL_OUTPUT_SIV
, WINED3DSIH_DCL_OUTPUT_SIV
, "", "",
1021 shader_sm4_read_declaration_register_semantic
},
1022 {WINED3D_SM4_OP_DCL_TEMPS
, WINED3DSIH_DCL_TEMPS
, "", "",
1023 shader_sm4_read_declaration_count
},
1024 {WINED3D_SM4_OP_DCL_INDEXABLE_TEMP
, WINED3DSIH_DCL_INDEXABLE_TEMP
, "", "",
1025 shader_sm4_read_dcl_indexable_temp
},
1026 {WINED3D_SM4_OP_DCL_GLOBAL_FLAGS
, WINED3DSIH_DCL_GLOBAL_FLAGS
, "", "",
1027 shader_sm4_read_dcl_global_flags
},
1028 {WINED3D_SM4_OP_LOD
, WINED3DSIH_LOD
, "f", "fRS"},
1029 {WINED3D_SM4_OP_GATHER4
, WINED3DSIH_GATHER4
, "u", "fRS"},
1030 {WINED3D_SM4_OP_SAMPLE_POS
, WINED3DSIH_SAMPLE_POS
, "f", "Ru"},
1031 {WINED3D_SM4_OP_SAMPLE_INFO
, WINED3DSIH_SAMPLE_INFO
, "f", "R"},
1032 {WINED3D_SM5_OP_HS_DECLS
, WINED3DSIH_HS_DECLS
, "", ""},
1033 {WINED3D_SM5_OP_HS_CONTROL_POINT_PHASE
, WINED3DSIH_HS_CONTROL_POINT_PHASE
, "", ""},
1034 {WINED3D_SM5_OP_HS_FORK_PHASE
, WINED3DSIH_HS_FORK_PHASE
, "", ""},
1035 {WINED3D_SM5_OP_HS_JOIN_PHASE
, WINED3DSIH_HS_JOIN_PHASE
, "", ""},
1036 {WINED3D_SM5_OP_EMIT_STREAM
, WINED3DSIH_EMIT_STREAM
, "", "f"},
1037 {WINED3D_SM5_OP_CUT_STREAM
, WINED3DSIH_CUT_STREAM
, "", "f"},
1038 {WINED3D_SM5_OP_FCALL
, WINED3DSIH_FCALL
, "", "O",
1039 shader_sm5_read_fcall
},
1040 {WINED3D_SM5_OP_BUFINFO
, WINED3DSIH_BUFINFO
, "i", "U"},
1041 {WINED3D_SM5_OP_DERIV_RTX_COARSE
, WINED3DSIH_DSX_COARSE
, "f", "f"},
1042 {WINED3D_SM5_OP_DERIV_RTX_FINE
, WINED3DSIH_DSX_FINE
, "f", "f"},
1043 {WINED3D_SM5_OP_DERIV_RTY_COARSE
, WINED3DSIH_DSY_COARSE
, "f", "f"},
1044 {WINED3D_SM5_OP_DERIV_RTY_FINE
, WINED3DSIH_DSY_FINE
, "f", "f"},
1045 {WINED3D_SM5_OP_GATHER4_C
, WINED3DSIH_GATHER4_C
, "f", "fRSf"},
1046 {WINED3D_SM5_OP_GATHER4_PO
, WINED3DSIH_GATHER4_PO
, "f", "fiRS"},
1047 {WINED3D_SM5_OP_GATHER4_PO_C
, WINED3DSIH_GATHER4_PO_C
, "f", "fiRSf"},
1048 {WINED3D_SM5_OP_RCP
, WINED3DSIH_RCP
, "f", "f"},
1049 {WINED3D_SM5_OP_F32TOF16
, WINED3DSIH_F32TOF16
, "u", "f"},
1050 {WINED3D_SM5_OP_F16TOF32
, WINED3DSIH_F16TOF32
, "f", "u"},
1051 {WINED3D_SM5_OP_COUNTBITS
, WINED3DSIH_COUNTBITS
, "u", "u"},
1052 {WINED3D_SM5_OP_FIRSTBIT_HI
, WINED3DSIH_FIRSTBIT_HI
, "u", "u"},
1053 {WINED3D_SM5_OP_FIRSTBIT_LO
, WINED3DSIH_FIRSTBIT_LO
, "u", "u"},
1054 {WINED3D_SM5_OP_FIRSTBIT_SHI
, WINED3DSIH_FIRSTBIT_SHI
, "u", "i"},
1055 {WINED3D_SM5_OP_UBFE
, WINED3DSIH_UBFE
, "u", "iiu"},
1056 {WINED3D_SM5_OP_IBFE
, WINED3DSIH_IBFE
, "i", "iii"},
1057 {WINED3D_SM5_OP_BFI
, WINED3DSIH_BFI
, "u", "iiuu"},
1058 {WINED3D_SM5_OP_BFREV
, WINED3DSIH_BFREV
, "u", "u"},
1059 {WINED3D_SM5_OP_SWAPC
, WINED3DSIH_SWAPC
, "ff", "uff"},
1060 {WINED3D_SM5_OP_DCL_STREAM
, WINED3DSIH_DCL_STREAM
, "", "O"},
1061 {WINED3D_SM5_OP_DCL_FUNCTION_BODY
, WINED3DSIH_DCL_FUNCTION_BODY
, "", "",
1062 shader_sm5_read_dcl_function_body
},
1063 {WINED3D_SM5_OP_DCL_FUNCTION_TABLE
, WINED3DSIH_DCL_FUNCTION_TABLE
, "", "",
1064 shader_sm5_read_dcl_function_table
},
1065 {WINED3D_SM5_OP_DCL_INTERFACE
, WINED3DSIH_DCL_INTERFACE
, "", "",
1066 shader_sm5_read_dcl_interface
},
1067 {WINED3D_SM5_OP_DCL_INPUT_CONTROL_POINT_COUNT
, WINED3DSIH_DCL_INPUT_CONTROL_POINT_COUNT
, "", "",
1068 shader_sm5_read_control_point_count
},
1069 {WINED3D_SM5_OP_DCL_OUTPUT_CONTROL_POINT_COUNT
, WINED3DSIH_DCL_OUTPUT_CONTROL_POINT_COUNT
, "", "",
1070 shader_sm5_read_control_point_count
},
1071 {WINED3D_SM5_OP_DCL_TESSELLATOR_DOMAIN
, WINED3DSIH_DCL_TESSELLATOR_DOMAIN
, "", "",
1072 shader_sm5_read_dcl_tessellator_domain
},
1073 {WINED3D_SM5_OP_DCL_TESSELLATOR_PARTITIONING
, WINED3DSIH_DCL_TESSELLATOR_PARTITIONING
, "", "",
1074 shader_sm5_read_dcl_tessellator_partitioning
},
1075 {WINED3D_SM5_OP_DCL_TESSELLATOR_OUTPUT_PRIMITIVE
, WINED3DSIH_DCL_TESSELLATOR_OUTPUT_PRIMITIVE
, "", "",
1076 shader_sm5_read_dcl_tessellator_output_primitive
},
1077 {WINED3D_SM5_OP_DCL_HS_MAX_TESSFACTOR
, WINED3DSIH_DCL_HS_MAX_TESSFACTOR
, "", "",
1078 shader_sm5_read_dcl_hs_max_tessfactor
},
1079 {WINED3D_SM5_OP_DCL_HS_FORK_PHASE_INSTANCE_COUNT
, WINED3DSIH_DCL_HS_FORK_PHASE_INSTANCE_COUNT
, "", "",
1080 shader_sm4_read_declaration_count
},
1081 {WINED3D_SM5_OP_DCL_HS_JOIN_PHASE_INSTANCE_COUNT
, WINED3DSIH_DCL_HS_JOIN_PHASE_INSTANCE_COUNT
, "", "",
1082 shader_sm4_read_declaration_count
},
1083 {WINED3D_SM5_OP_DCL_THREAD_GROUP
, WINED3DSIH_DCL_THREAD_GROUP
, "", "",
1084 shader_sm5_read_dcl_thread_group
},
1085 {WINED3D_SM5_OP_DCL_UAV_TYPED
, WINED3DSIH_DCL_UAV_TYPED
, "", "",
1086 shader_sm4_read_dcl_resource
},
1087 {WINED3D_SM5_OP_DCL_UAV_RAW
, WINED3DSIH_DCL_UAV_RAW
, "", "",
1088 shader_sm5_read_dcl_uav_raw
},
1089 {WINED3D_SM5_OP_DCL_UAV_STRUCTURED
, WINED3DSIH_DCL_UAV_STRUCTURED
, "", "",
1090 shader_sm5_read_dcl_uav_structured
},
1091 {WINED3D_SM5_OP_DCL_TGSM_RAW
, WINED3DSIH_DCL_TGSM_RAW
, "", "",
1092 shader_sm5_read_dcl_tgsm_raw
},
1093 {WINED3D_SM5_OP_DCL_TGSM_STRUCTURED
, WINED3DSIH_DCL_TGSM_STRUCTURED
, "", "",
1094 shader_sm5_read_dcl_tgsm_structured
},
1095 {WINED3D_SM5_OP_DCL_RESOURCE_RAW
, WINED3DSIH_DCL_RESOURCE_RAW
, "", "",
1096 shader_sm5_read_dcl_resource_raw
},
1097 {WINED3D_SM5_OP_DCL_RESOURCE_STRUCTURED
, WINED3DSIH_DCL_RESOURCE_STRUCTURED
, "", "",
1098 shader_sm5_read_dcl_resource_structured
},
1099 {WINED3D_SM5_OP_LD_UAV_TYPED
, WINED3DSIH_LD_UAV_TYPED
, "u", "iU"},
1100 {WINED3D_SM5_OP_STORE_UAV_TYPED
, WINED3DSIH_STORE_UAV_TYPED
, "U", "iu"},
1101 {WINED3D_SM5_OP_LD_RAW
, WINED3DSIH_LD_RAW
, "u", "iU"},
1102 {WINED3D_SM5_OP_STORE_RAW
, WINED3DSIH_STORE_RAW
, "U", "iu"},
1103 {WINED3D_SM5_OP_LD_STRUCTURED
, WINED3DSIH_LD_STRUCTURED
, "u", "iiR"},
1104 {WINED3D_SM5_OP_STORE_STRUCTURED
, WINED3DSIH_STORE_STRUCTURED
, "U", "iiu"},
1105 {WINED3D_SM5_OP_ATOMIC_AND
, WINED3DSIH_ATOMIC_AND
, "U", "iu"},
1106 {WINED3D_SM5_OP_ATOMIC_OR
, WINED3DSIH_ATOMIC_OR
, "U", "iu"},
1107 {WINED3D_SM5_OP_ATOMIC_XOR
, WINED3DSIH_ATOMIC_XOR
, "U", "iu"},
1108 {WINED3D_SM5_OP_ATOMIC_CMP_STORE
, WINED3DSIH_ATOMIC_CMP_STORE
, "U", "iuu"},
1109 {WINED3D_SM5_OP_ATOMIC_IADD
, WINED3DSIH_ATOMIC_IADD
, "U", "ii"},
1110 {WINED3D_SM5_OP_ATOMIC_IMAX
, WINED3DSIH_ATOMIC_IMAX
, "U", "ii"},
1111 {WINED3D_SM5_OP_ATOMIC_IMIN
, WINED3DSIH_ATOMIC_IMIN
, "U", "ii"},
1112 {WINED3D_SM5_OP_ATOMIC_UMAX
, WINED3DSIH_ATOMIC_UMAX
, "U", "iu"},
1113 {WINED3D_SM5_OP_ATOMIC_UMIN
, WINED3DSIH_ATOMIC_UMIN
, "U", "iu"},
1114 {WINED3D_SM5_OP_IMM_ATOMIC_ALLOC
, WINED3DSIH_IMM_ATOMIC_ALLOC
, "u", "U"},
1115 {WINED3D_SM5_OP_IMM_ATOMIC_CONSUME
, WINED3DSIH_IMM_ATOMIC_CONSUME
, "u", "U"},
1116 {WINED3D_SM5_OP_IMM_ATOMIC_IADD
, WINED3DSIH_IMM_ATOMIC_IADD
, "uU", "ii"},
1117 {WINED3D_SM5_OP_IMM_ATOMIC_AND
, WINED3DSIH_IMM_ATOMIC_AND
, "uU", "iu"},
1118 {WINED3D_SM5_OP_IMM_ATOMIC_OR
, WINED3DSIH_IMM_ATOMIC_OR
, "uU", "iu"},
1119 {WINED3D_SM5_OP_IMM_ATOMIC_XOR
, WINED3DSIH_IMM_ATOMIC_XOR
, "uU", "iu"},
1120 {WINED3D_SM5_OP_IMM_ATOMIC_EXCH
, WINED3DSIH_IMM_ATOMIC_EXCH
, "uU", "iu"},
1121 {WINED3D_SM5_OP_IMM_ATOMIC_CMP_EXCH
, WINED3DSIH_IMM_ATOMIC_CMP_EXCH
, "uU", "iuu"},
1122 {WINED3D_SM5_OP_IMM_ATOMIC_IMAX
, WINED3DSIH_IMM_ATOMIC_IMAX
, "iU", "ii"},
1123 {WINED3D_SM5_OP_IMM_ATOMIC_IMIN
, WINED3DSIH_IMM_ATOMIC_IMIN
, "iU", "ii"},
1124 {WINED3D_SM5_OP_IMM_ATOMIC_UMAX
, WINED3DSIH_IMM_ATOMIC_UMAX
, "uU", "iu"},
1125 {WINED3D_SM5_OP_IMM_ATOMIC_UMIN
, WINED3DSIH_IMM_ATOMIC_UMIN
, "uU", "iu"},
1126 {WINED3D_SM5_OP_SYNC
, WINED3DSIH_SYNC
, "", "",
1127 shader_sm5_read_sync
},
1128 {WINED3D_SM5_OP_EVAL_SAMPLE_INDEX
, WINED3DSIH_EVAL_SAMPLE_INDEX
, "f", "fi"},
1129 {WINED3D_SM5_OP_DCL_GS_INSTANCES
, WINED3DSIH_DCL_GS_INSTANCES
, "", "",
1130 shader_sm4_read_declaration_count
},
1133 static const enum wined3d_shader_register_type register_type_table
[] =
1135 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP
,
1136 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT
,
1137 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT
,
1138 /* WINED3D_SM4_RT_INDEXABLE_TEMP */ WINED3DSPR_IDXTEMP
,
1139 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST
,
1141 /* WINED3D_SM4_RT_SAMPLER */ WINED3DSPR_SAMPLER
,
1142 /* WINED3D_SM4_RT_RESOURCE */ WINED3DSPR_RESOURCE
,
1143 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER
,
1144 /* WINED3D_SM4_RT_IMMCONSTBUFFER */ WINED3DSPR_IMMCONSTBUFFER
,
1146 /* WINED3D_SM4_RT_PRIMID */ WINED3DSPR_PRIMID
,
1147 /* WINED3D_SM4_RT_DEPTHOUT */ WINED3DSPR_DEPTHOUT
,
1148 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL
,
1149 /* WINED3D_SM4_RT_RASTERIZER */ WINED3DSPR_RASTERIZER
,
1150 /* WINED3D_SM4_RT_OMASK */ WINED3DSPR_SAMPLEMASK
,
1151 /* WINED3D_SM5_RT_STREAM */ WINED3DSPR_STREAM
,
1152 /* WINED3D_SM5_RT_FUNCTION_BODY */ WINED3DSPR_FUNCTIONBODY
,
1154 /* WINED3D_SM5_RT_FUNCTION_POINTER */ WINED3DSPR_FUNCTIONPOINTER
,
1157 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT_ID */ WINED3DSPR_OUTPOINTID
,
1158 /* WINED3D_SM5_RT_FORK_INSTANCE_ID */ WINED3DSPR_FORKINSTID
,
1159 /* WINED3D_SM5_RT_JOIN_INSTANCE_ID */ WINED3DSPR_JOININSTID
,
1160 /* WINED3D_SM5_RT_INPUT_CONTROL_POINT */ WINED3DSPR_INCONTROLPOINT
,
1161 /* WINED3D_SM5_RT_OUTPUT_CONTROL_POINT */ WINED3DSPR_OUTCONTROLPOINT
,
1162 /* WINED3D_SM5_RT_PATCH_CONSTANT_DATA */ WINED3DSPR_PATCHCONST
,
1163 /* WINED3D_SM5_RT_DOMAIN_LOCATION */ WINED3DSPR_TESSCOORD
,
1165 /* WINED3D_SM5_RT_UAV */ WINED3DSPR_UAV
,
1166 /* WINED3D_SM5_RT_SHARED_MEMORY */ WINED3DSPR_GROUPSHAREDMEM
,
1167 /* WINED3D_SM5_RT_THREAD_ID */ WINED3DSPR_THREADID
,
1168 /* WINED3D_SM5_RT_THREAD_GROUP_ID */ WINED3DSPR_THREADGROUPID
,
1169 /* WINED3D_SM5_RT_LOCAL_THREAD_ID */ WINED3DSPR_LOCALTHREADID
,
1170 /* WINED3D_SM5_RT_COVERAGE */ WINED3DSPR_COVERAGE
,
1171 /* WINED3D_SM5_RT_LOCAL_THREAD_INDEX */ WINED3DSPR_LOCALTHREADINDEX
,
1172 /* WINED3D_SM5_RT_GS_INSTANCE_ID */ WINED3DSPR_GSINSTID
,
1173 /* WINED3D_SM5_RT_DEPTHOUT_GREATER_EQUAL */ WINED3DSPR_DEPTHOUTGE
,
1174 /* WINED3D_SM5_RT_DEPTHOUT_LESS_EQUAL */ WINED3DSPR_DEPTHOUTLE
,
1177 static const struct wined3d_sm4_opcode_info
*get_opcode_info(enum wined3d_sm4_opcode opcode
)
1181 for (i
= 0; i
< ARRAY_SIZE(opcode_table
); ++i
)
1183 if (opcode
== opcode_table
[i
].opcode
) return &opcode_table
[i
];
1189 static void map_register(const struct wined3d_sm4_data
*priv
, struct wined3d_shader_register
*reg
)
1191 switch (priv
->shader_version
.type
)
1193 case WINED3D_SHADER_TYPE_PIXEL
:
1194 if (reg
->type
== WINED3DSPR_OUTPUT
)
1196 unsigned int reg_idx
= reg
->idx
[0].offset
;
1198 if (reg_idx
>= ARRAY_SIZE(priv
->output_map
))
1200 ERR("Invalid output index %u.\n", reg_idx
);
1204 reg
->type
= WINED3DSPR_COLOROUT
;
1205 reg
->idx
[0].offset
= priv
->output_map
[reg_idx
];
1214 static enum wined3d_data_type
map_data_type(char t
)
1219 return WINED3D_DATA_FLOAT
;
1221 return WINED3D_DATA_INT
;
1223 return WINED3D_DATA_UINT
;
1225 return WINED3D_DATA_OPAQUE
;
1227 return WINED3D_DATA_RESOURCE
;
1229 return WINED3D_DATA_SAMPLER
;
1231 return WINED3D_DATA_UAV
;
1233 ERR("Invalid data type '%c'.\n", t
);
1234 return WINED3D_DATA_FLOAT
;
1238 static enum wined3d_shader_type
wined3d_get_sm4_shader_type(const DWORD
*byte_code
, size_t byte_code_size
)
1242 if (byte_code_size
/ sizeof(*byte_code
) < 1)
1244 WARN("Invalid byte code size %lu.\n", (long)byte_code_size
);
1245 return WINED3D_SHADER_TYPE_INVALID
;
1248 shader_type
= byte_code
[0] >> 16;
1249 switch (shader_type
)
1251 case WINED3D_SM4_PS
:
1252 return WINED3D_SHADER_TYPE_PIXEL
;
1254 case WINED3D_SM4_VS
:
1255 return WINED3D_SHADER_TYPE_VERTEX
;
1257 case WINED3D_SM4_GS
:
1258 return WINED3D_SHADER_TYPE_GEOMETRY
;
1260 case WINED3D_SM5_HS
:
1261 return WINED3D_SHADER_TYPE_HULL
;
1263 case WINED3D_SM5_DS
:
1264 return WINED3D_SHADER_TYPE_DOMAIN
;
1266 case WINED3D_SM5_CS
:
1267 return WINED3D_SHADER_TYPE_COMPUTE
;
1270 FIXME("Unrecognised shader type %#x.\n", shader_type
);
1271 return WINED3D_SHADER_TYPE_INVALID
;
1275 static void *shader_sm4_init(const DWORD
*byte_code
, size_t byte_code_size
,
1276 const struct wined3d_shader_signature
*output_signature
)
1278 DWORD version_token
, token_count
;
1279 struct wined3d_sm4_data
*priv
;
1282 if (byte_code_size
/ sizeof(*byte_code
) < 2)
1284 WARN("Invalid byte code size %lu.\n", (long)byte_code_size
);
1288 version_token
= byte_code
[0];
1289 TRACE("Version: 0x%08x.\n", version_token
);
1290 token_count
= byte_code
[1];
1291 TRACE("Token count: %u.\n", token_count
);
1293 if (token_count
< 2 || byte_code_size
/ sizeof(*byte_code
) < token_count
)
1295 WARN("Invalid token count %u.\n", token_count
);
1299 if (!(priv
= heap_alloc(sizeof(*priv
))))
1301 ERR("Failed to allocate private data\n");
1305 priv
->start
= &byte_code
[2];
1306 priv
->end
= &byte_code
[token_count
];
1308 priv
->shader_version
.type
= wined3d_get_sm4_shader_type(byte_code
, byte_code_size
);
1309 if (priv
->shader_version
.type
== WINED3D_SHADER_TYPE_INVALID
)
1315 priv
->shader_version
.major
= WINED3D_SM4_VERSION_MAJOR(version_token
);
1316 priv
->shader_version
.minor
= WINED3D_SM4_VERSION_MINOR(version_token
);
1318 memset(priv
->output_map
, 0xff, sizeof(priv
->output_map
));
1319 for (i
= 0; i
< output_signature
->element_count
; ++i
)
1321 struct wined3d_shader_signature_element
*e
= &output_signature
->elements
[i
];
1323 if (e
->register_idx
>= ARRAY_SIZE(priv
->output_map
))
1325 WARN("Invalid output index %u.\n", e
->register_idx
);
1329 priv
->output_map
[e
->register_idx
] = e
->semantic_idx
;
1332 list_init(&priv
->src_free
);
1333 list_init(&priv
->src
);
1338 static void shader_sm4_free(void *data
)
1340 struct wined3d_shader_src_param_entry
*e1
, *e2
;
1341 struct wined3d_sm4_data
*priv
= data
;
1343 list_move_head(&priv
->src_free
, &priv
->src
);
1344 LIST_FOR_EACH_ENTRY_SAFE(e1
, e2
, &priv
->src_free
, struct wined3d_shader_src_param_entry
, entry
)
1351 static struct wined3d_shader_src_param
*get_src_param(struct wined3d_sm4_data
*priv
)
1353 struct wined3d_shader_src_param_entry
*e
;
1356 if (!list_empty(&priv
->src_free
))
1358 elem
= list_head(&priv
->src_free
);
1363 if (!(e
= heap_alloc(sizeof(*e
))))
1368 list_add_tail(&priv
->src
, elem
);
1369 e
= LIST_ENTRY(elem
, struct wined3d_shader_src_param_entry
, entry
);
1373 static void shader_sm4_read_header(void *data
, const DWORD
**ptr
, struct wined3d_shader_version
*shader_version
)
1375 struct wined3d_sm4_data
*priv
= data
;
1378 *shader_version
= priv
->shader_version
;
1381 static BOOL
shader_sm4_read_reg_idx(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
, const DWORD
*end
,
1382 DWORD addressing
, struct wined3d_shader_register_index
*reg_idx
)
1384 if (addressing
& WINED3D_SM4_ADDRESSING_RELATIVE
)
1386 struct wined3d_shader_src_param
*rel_addr
= get_src_param(priv
);
1388 if (!(reg_idx
->rel_addr
= rel_addr
))
1390 ERR("Failed to get src param for relative addressing.\n");
1394 if (addressing
& WINED3D_SM4_ADDRESSING_OFFSET
)
1395 reg_idx
->offset
= *(*ptr
)++;
1397 reg_idx
->offset
= 0;
1398 shader_sm4_read_src_param(priv
, ptr
, end
, WINED3D_DATA_INT
, rel_addr
);
1402 reg_idx
->rel_addr
= NULL
;
1403 reg_idx
->offset
= *(*ptr
)++;
1409 static BOOL
shader_sm4_read_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
, const DWORD
*end
,
1410 enum wined3d_data_type data_type
, struct wined3d_shader_register
*param
,
1411 enum wined3d_shader_src_modifier
*modifier
)
1413 enum wined3d_sm4_register_type register_type
;
1418 WARN("Invalid ptr %p >= end %p.\n", *ptr
, end
);
1423 register_type
= (token
& WINED3D_SM4_REGISTER_TYPE_MASK
) >> WINED3D_SM4_REGISTER_TYPE_SHIFT
;
1424 if (register_type
>= ARRAY_SIZE(register_type_table
)
1425 || register_type_table
[register_type
] == ~0u)
1427 FIXME("Unhandled register type %#x.\n", register_type
);
1428 param
->type
= WINED3DSPR_TEMP
;
1432 param
->type
= register_type_table
[register_type
];
1434 param
->data_type
= data_type
;
1436 if (token
& WINED3D_SM4_REGISTER_MODIFIER
)
1442 WARN("Invalid ptr %p >= end %p.\n", *ptr
, end
);
1450 *modifier
= WINED3DSPSM_NEG
;
1454 *modifier
= WINED3DSPSM_ABS
;
1458 *modifier
= WINED3DSPSM_ABSNEG
;
1462 FIXME("Skipping modifier 0x%08x.\n", m
);
1464 *modifier
= WINED3DSPSM_NONE
;
1470 *modifier
= WINED3DSPSM_NONE
;
1473 order
= (token
& WINED3D_SM4_REGISTER_ORDER_MASK
) >> WINED3D_SM4_REGISTER_ORDER_SHIFT
;
1476 param
->idx
[0].offset
= ~0U;
1479 DWORD addressing
= (token
& WINED3D_SM4_ADDRESSING_MASK0
) >> WINED3D_SM4_ADDRESSING_SHIFT0
;
1480 if (!(shader_sm4_read_reg_idx(priv
, ptr
, end
, addressing
, ¶m
->idx
[0])))
1482 ERR("Failed to read register index.\n");
1488 param
->idx
[1].offset
= ~0U;
1491 DWORD addressing
= (token
& WINED3D_SM4_ADDRESSING_MASK1
) >> WINED3D_SM4_ADDRESSING_SHIFT1
;
1492 if (!(shader_sm4_read_reg_idx(priv
, ptr
, end
, addressing
, ¶m
->idx
[1])))
1494 ERR("Failed to read register index.\n");
1500 FIXME("Unhandled order %u.\n", order
);
1502 if (register_type
== WINED3D_SM4_RT_IMMCONST
)
1504 enum wined3d_sm4_dimension dimension
= (token
& WINED3D_SM4_DIMENSION_MASK
) >> WINED3D_SM4_DIMENSION_SHIFT
;
1508 case WINED3D_SM4_DIMENSION_SCALAR
:
1509 param
->immconst_type
= WINED3D_IMMCONST_SCALAR
;
1512 WARN("Invalid ptr %p, end %p.\n", *ptr
, end
);
1515 memcpy(param
->u
.immconst_data
, *ptr
, 1 * sizeof(DWORD
));
1519 case WINED3D_SM4_DIMENSION_VEC4
:
1520 param
->immconst_type
= WINED3D_IMMCONST_VEC4
;
1523 WARN("Invalid ptr %p, end %p.\n", *ptr
, end
);
1526 memcpy(param
->u
.immconst_data
, *ptr
, 4 * sizeof(DWORD
));
1531 FIXME("Unhandled dimension %#x.\n", dimension
);
1536 map_register(priv
, param
);
1541 static BOOL
shader_sm4_read_src_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
, const DWORD
*end
,
1542 enum wined3d_data_type data_type
, struct wined3d_shader_src_param
*src_param
)
1548 WARN("Invalid ptr %p >= end %p.\n", *ptr
, end
);
1553 if (!shader_sm4_read_param(priv
, ptr
, end
, data_type
, &src_param
->reg
, &src_param
->modifiers
))
1555 ERR("Failed to read parameter.\n");
1559 if (src_param
->reg
.type
== WINED3DSPR_IMMCONST
)
1561 src_param
->swizzle
= WINED3DSP_NOSWIZZLE
;
1565 enum wined3d_sm4_swizzle_type swizzle_type
=
1566 (token
& WINED3D_SM4_SWIZZLE_TYPE_MASK
) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT
;
1568 switch (swizzle_type
)
1570 case WINED3D_SM4_SWIZZLE_NONE
:
1571 src_param
->swizzle
= WINED3DSP_NOSWIZZLE
;
1574 case WINED3D_SM4_SWIZZLE_SCALAR
:
1575 src_param
->swizzle
= (token
& WINED3D_SM4_SWIZZLE_MASK
) >> WINED3D_SM4_SWIZZLE_SHIFT
;
1576 src_param
->swizzle
= (src_param
->swizzle
& 0x3) * 0x55;
1579 case WINED3D_SM4_SWIZZLE_VEC4
:
1580 src_param
->swizzle
= (token
& WINED3D_SM4_SWIZZLE_MASK
) >> WINED3D_SM4_SWIZZLE_SHIFT
;
1584 FIXME("Unhandled swizzle type %#x.\n", swizzle_type
);
1592 static BOOL
shader_sm4_read_dst_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
, const DWORD
*end
,
1593 enum wined3d_data_type data_type
, struct wined3d_shader_dst_param
*dst_param
)
1595 enum wined3d_shader_src_modifier modifier
;
1600 WARN("Invalid ptr %p >= end %p.\n", *ptr
, end
);
1605 if (!shader_sm4_read_param(priv
, ptr
, end
, data_type
, &dst_param
->reg
, &modifier
))
1607 ERR("Failed to read parameter.\n");
1611 if (modifier
!= WINED3DSPSM_NONE
)
1613 ERR("Invalid source modifier %#x on destination register.\n", modifier
);
1617 dst_param
->write_mask
= (token
& WINED3D_SM4_WRITEMASK_MASK
) >> WINED3D_SM4_WRITEMASK_SHIFT
;
1618 dst_param
->modifiers
= 0;
1619 dst_param
->shift
= 0;
1624 static void shader_sm4_read_instruction_modifier(DWORD modifier
, struct wined3d_shader_instruction
*ins
)
1626 enum wined3d_sm4_instruction_modifier modifier_type
= modifier
& WINED3D_SM4_MODIFIER_MASK
;
1628 switch (modifier_type
)
1630 case WINED3D_SM4_MODIFIER_AOFFIMMI
:
1632 static const DWORD recognized_bits
= WINED3D_SM4_INSTRUCTION_MODIFIER
1633 | WINED3D_SM4_MODIFIER_MASK
1634 | WINED3D_SM4_AOFFIMMI_U_MASK
1635 | WINED3D_SM4_AOFFIMMI_V_MASK
1636 | WINED3D_SM4_AOFFIMMI_W_MASK
;
1638 /* Bit fields are used for sign extension. */
1646 if (modifier
& ~recognized_bits
)
1647 FIXME("Unhandled instruction modifier %#x.\n", modifier
);
1649 aoffimmi
.u
= (modifier
& WINED3D_SM4_AOFFIMMI_U_MASK
) >> WINED3D_SM4_AOFFIMMI_U_SHIFT
;
1650 aoffimmi
.v
= (modifier
& WINED3D_SM4_AOFFIMMI_V_MASK
) >> WINED3D_SM4_AOFFIMMI_V_SHIFT
;
1651 aoffimmi
.w
= (modifier
& WINED3D_SM4_AOFFIMMI_W_MASK
) >> WINED3D_SM4_AOFFIMMI_W_SHIFT
;
1652 ins
->texel_offset
.u
= aoffimmi
.u
;
1653 ins
->texel_offset
.v
= aoffimmi
.v
;
1654 ins
->texel_offset
.w
= aoffimmi
.w
;
1658 case WINED3D_SM5_MODIFIER_DATA_TYPE
:
1660 DWORD components
= (modifier
& WINED3D_SM5_MODIFIER_DATA_TYPE_MASK
) >> WINED3D_SM5_MODIFIER_DATA_TYPE_SHIFT
;
1661 enum wined3d_sm4_data_type data_type
= components
& 0xf;
1663 if ((components
& 0xfff0) != (components
& 0xf) * 0x1110)
1664 FIXME("Components (%#x) have different data types.\n", components
);
1665 ins
->resource_data_type
= data_type_table
[data_type
];
1669 case WINED3D_SM5_MODIFIER_RESOURCE_TYPE
:
1671 enum wined3d_sm4_resource_type resource_type
1672 = (modifier
& WINED3D_SM5_MODIFIER_RESOURCE_TYPE_MASK
) >> WINED3D_SM5_MODIFIER_RESOURCE_TYPE_SHIFT
;
1674 ins
->resource_type
= resource_type_table
[resource_type
];
1679 FIXME("Unhandled instruction modifier %#x.\n", modifier
);
/* Decode one SM4 instruction starting at *ptr into *ins.
 *
 * data: the parser state (struct wined3d_sm4_data); priv->end bounds the
 *       byte code, and priv->dst_param / priv->src_param back the
 *       instruction's parameter arrays.
 * ptr:  in/out cursor into the token stream.
 * ins:  receives handler index, flags, parameter counts and parameters.
 *
 * Whenever decoding cannot proceed (unknown opcode, parameter read failure,
 * invalid length), ins->handler_idx is set to WINED3DSIH_TABLE_SIZE.
 *
 * NOTE(review): this listing appears to omit some lines of the function
 * (e.g. the declarations of `remaining`, `p` and `precise`, and the jumps
 * taken after the WARN() calls) - confirm against the full file. */
1683 static void shader_sm4_read_instruction(void *data
, const DWORD
**ptr
, struct wined3d_shader_instruction
*ins
)
1685 const struct wined3d_sm4_opcode_info
*opcode_info
;
1686 DWORD opcode_token
, opcode
, previous_token
;
1687 struct wined3d_sm4_data
*priv
= data
;
1688 unsigned int i
, len
;
/* Presumably recycles the source parameters used by the previous
 * instruction - verify against the list helpers. */
1693 list_move_head(&priv
->src_free
, &priv
->src
);
1695 if (*ptr
>= priv
->end
)
1697 WARN("End of byte-code, failed to read opcode.\n");
1700 remaining
= priv
->end
- *ptr
;
1702 opcode_token
= *(*ptr
)++;
1703 opcode
= opcode_token
& WINED3D_SM4_OPCODE_MASK
;
/* Instruction length as encoded in the opcode token itself. */
1705 len
= ((opcode_token
& WINED3D_SM4_INSTRUCTION_LENGTH_MASK
) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT
);
1710 WARN("End of byte-code, failed to read length token.\n");
/* A zero length, or one exceeding the remaining tokens, is rejected. */
1715 if (!len
|| remaining
< len
)
1717 WARN("Read invalid length %u (remaining %lu).\n", len
, remaining
);
/* Dump the raw instruction tokens when the d3d_bytecode channel is on. */
1722 if (TRACE_ON(d3d_bytecode
))
1724 TRACE_(d3d_bytecode
)("[ %08x ", opcode_token
);
1725 for (i
= 0; i
< len
; ++i
)
1727 TRACE_(d3d_bytecode
)("%08x ", (*ptr
)[i
]);
1729 TRACE_(d3d_bytecode
)("]\n");
1732 if (!(opcode_info
= get_opcode_info(opcode
)))
1734 FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode
, opcode_token
);
1735 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
/* Defaults; instruction modifiers and parameter readers refine these. */
1740 ins
->handler_idx
= opcode_info
->handler_idx
;
1743 ins
->predicate
= NULL
;
/* dst_info / src_info hold one character per parameter, so their string
 * lengths are the parameter counts. */
1744 ins
->dst_count
= strlen(opcode_info
->dst_info
);
1745 ins
->dst
= priv
->dst_param
;
1746 ins
->src_count
= strlen(opcode_info
->src_info
);
1747 ins
->src
= priv
->src_param
;
1748 ins
->resource_type
= WINED3D_SHADER_RESOURCE_NONE
;
1749 ins
->resource_data_type
= WINED3D_DATA_FLOAT
;
1750 memset(&ins
->texel_offset
, 0, sizeof(ins
->texel_offset
));
/* Opcodes with a dedicated reader are decoded entirely by that reader. */
1755 if (opcode_info
->read_opcode_func
)
1757 opcode_info
->read_opcode_func(ins
, opcode
, opcode_token
, p
, len
, priv
);
1761 enum wined3d_shader_dst_modifier instruction_dst_modifier
= WINED3DSPDM_NONE
;
/* Each token with WINED3D_SM4_INSTRUCTION_MODIFIER set is followed by
 * another modifier token; stop at the end of the instruction. */
1763 previous_token
= opcode_token
;
1764 while (previous_token
& WINED3D_SM4_INSTRUCTION_MODIFIER
&& p
!= *ptr
)
1765 shader_sm4_read_instruction_modifier(previous_token
= *p
++, ins
);
1767 ins
->flags
= (opcode_token
& WINED3D_SM4_INSTRUCTION_FLAGS_MASK
) >> WINED3D_SM4_INSTRUCTION_FLAGS_SHIFT
;
/* Saturate is removed from ins->flags and applied to every destination
 * parameter as a modifier instead. */
1768 if (ins
->flags
& WINED3D_SM4_INSTRUCTION_FLAG_SATURATE
)
1770 ins
->flags
&= ~WINED3D_SM4_INSTRUCTION_FLAG_SATURATE
;
1771 instruction_dst_modifier
= WINED3DSPDM_SATURATE
;
1773 precise
= (opcode_token
& WINED3D_SM5_PRECISE_MASK
) >> WINED3D_SM5_PRECISE_SHIFT
;
1774 ins
->flags
|= precise
<< WINED3DSI_PRECISE_SHIFT
;
1776 for (i
= 0; i
< ins
->dst_count
; ++i
)
1778 if (!(shader_sm4_read_dst_param(priv
, &p
, *ptr
, map_data_type(opcode_info
->dst_info
[i
]),
1779 &priv
->dst_param
[i
])))
1781 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
1784 priv
->dst_param
[i
].modifiers
|= instruction_dst_modifier
;
1787 for (i
= 0; i
< ins
->src_count
; ++i
)
1789 if (!(shader_sm4_read_src_param(priv
, &p
, *ptr
, map_data_type(opcode_info
->src_info
[i
]),
1790 &priv
->src_param
[i
])))
1792 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
1802 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
1806 static BOOL
shader_sm4_is_end(void *data
, const DWORD
**ptr
)
1808 struct wined3d_sm4_data
*priv
= data
;
1809 return *ptr
== priv
->end
;
/* Frontend callback table exposing the SM4 parser.
 * NOTE(review): only the read_header and read_instruction entries are
 * visible in this listing; the remaining initializers are presumably on
 * lines not shown - confirm against the full file. */
1812 const struct wined3d_shader_frontend sm4_shader_frontend
=
1816 shader_sm4_read_header
,
1817 shader_sm4_read_instruction
,
/* Four-character codes for the DXBC container (TAG_DXBC) and for the chunk
 * tags compared against while walking its chunks. */
1821 #define TAG_AON9 WINEMAKEFOURCC('A', 'o', 'n', '9')
1822 #define TAG_DXBC WINEMAKEFOURCC('D', 'X', 'B', 'C')
1823 #define TAG_ISG1 WINEMAKEFOURCC('I', 'S', 'G', '1')
1824 #define TAG_ISGN WINEMAKEFOURCC('I', 'S', 'G', 'N')
1825 #define TAG_OSG1 WINEMAKEFOURCC('O', 'S', 'G', '1')
1826 #define TAG_OSG5 WINEMAKEFOURCC('O', 'S', 'G', '5')
1827 #define TAG_OSGN WINEMAKEFOURCC('O', 'S', 'G', 'N')
1828 #define TAG_PCSG WINEMAKEFOURCC('P', 'C', 'S', 'G')
1829 #define TAG_PSG1 WINEMAKEFOURCC('P', 'S', 'G', '1')
1830 #define TAG_SHDR WINEMAKEFOURCC('S', 'H', 'D', 'R')
1831 #define TAG_SHEX WINEMAKEFOURCC('S', 'H', 'E', 'X')
/* NOTE(review): these look like members of struct aon9_header (both are
 * read through a `const struct aon9_header *` in the Aon9 chunk handling);
 * the struct's opening line is not visible in this listing - confirm. */
/* Shader version value, only used for tracing by the visible code. */
1836 DWORD shader_version
;
/* Offset of the shader byte code, relative to the start of the chunk data. */
1838 DWORD byte_code_offset
;
/* State passed to shader_dxbc_chunk_handler() through parse_dxbc()'s opaque
 * context pointer. */
struct shader_handler_context
{
    /* Shader whose signatures and byte code pointer get filled in. */
    struct wined3d_shader *shader;
    /* Receives the byte code format of the code chunk that was accepted. */
    enum wined3d_shader_byte_code_format *format;
    /* Compared against 4 to decide which chunks are used and which skipped. */
    unsigned int max_version;
};
1848 static void read_dword(const char **ptr
, DWORD
*d
)
1850 memcpy(d
, *ptr
, sizeof(*d
));
1854 static BOOL
require_space(size_t offset
, size_t count
, size_t size
, size_t data_size
)
1856 return !count
|| (data_size
- offset
) / count
>= size
;
1859 static void skip_dword_unknown(const char **ptr
, unsigned int count
)
1864 WARN("Skipping %u unknown DWORDs:\n", count
);
1865 for (i
= 0; i
< count
; ++i
)
1867 read_dword(ptr
, &d
);
1868 WARN("\t0x%08x\n", d
);
1872 static HRESULT
parse_dxbc(const char *data
, SIZE_T data_size
,
1873 HRESULT (*chunk_handler
)(const char *data
, DWORD data_size
, DWORD tag
, void *ctx
), void *ctx
)
1875 const char *ptr
= data
;
1883 read_dword(&ptr
, &tag
);
1884 TRACE("tag: %s.\n", debugstr_an((const char *)&tag
, 4));
1886 if (tag
!= TAG_DXBC
)
1888 WARN("Wrong tag.\n");
1889 return E_INVALIDARG
;
1892 WARN("Ignoring DXBC checksum.\n");
1893 skip_dword_unknown(&ptr
, 4);
1895 read_dword(&ptr
, &version
);
1896 TRACE("version: %#x.\n", version
);
1897 if (version
!= 0x00000001)
1899 WARN("Got unexpected DXBC version %#x.\n", version
);
1900 return E_INVALIDARG
;
1903 read_dword(&ptr
, &total_size
);
1904 TRACE("total size: %#x\n", total_size
);
1906 read_dword(&ptr
, &chunk_count
);
1907 TRACE("chunk count: %#x\n", chunk_count
);
1909 for (i
= 0; i
< chunk_count
; ++i
)
1911 DWORD chunk_tag
, chunk_size
;
1912 const char *chunk_ptr
;
1915 read_dword(&ptr
, &chunk_offset
);
1916 TRACE("chunk %u at offset %#x\n", i
, chunk_offset
);
1918 if (chunk_offset
>= data_size
|| !require_space(chunk_offset
, 2, sizeof(DWORD
), data_size
))
1920 WARN("Invalid chunk offset %#x (data size %#lx).\n", chunk_offset
, data_size
);
1924 chunk_ptr
= data
+ chunk_offset
;
1926 read_dword(&chunk_ptr
, &chunk_tag
);
1927 read_dword(&chunk_ptr
, &chunk_size
);
1929 if (!require_space(chunk_ptr
- data
, 1, chunk_size
, data_size
))
1931 WARN("Invalid chunk size %#x (data size %#lx, chunk offset %#x).\n",
1932 chunk_size
, data_size
, chunk_offset
);
1936 if (FAILED(hr
= chunk_handler(chunk_ptr
, chunk_size
, chunk_tag
, ctx
)))
1943 static const char *shader_get_string(const char *data
, size_t data_size
, DWORD offset
)
1945 if (offset
>= data_size
)
1947 WARN("Invalid offset %#x (data size %#lx).\n", offset
, (long)data_size
);
1951 if (!memchr( data
+ offset
, 0, data_size
- offset
))
1954 return data
+ offset
;
1957 static HRESULT
shader_parse_signature(DWORD tag
, const char *data
, DWORD data_size
,
1958 struct wined3d_shader_signature
*s
)
1960 struct wined3d_shader_signature_element
*e
;
1961 bool has_stream_index
, has_min_precision
;
1962 const char *ptr
= data
;
1966 if (!require_space(0, 2, sizeof(DWORD
), data_size
))
1968 WARN("Invalid data size %#x.\n", data_size
);
1969 return E_INVALIDARG
;
1972 read_dword(&ptr
, &count
);
1973 TRACE("%u elements.\n", count
);
1975 skip_dword_unknown(&ptr
, 1); /* It seems to always be 0x00000008. */
1977 if (!require_space(ptr
- data
, count
, 6 * sizeof(DWORD
), data_size
))
1979 WARN("Invalid count %#x (data size %#x).\n", count
, data_size
);
1980 return E_INVALIDARG
;
1983 if (!(e
= heap_calloc(count
, sizeof(*e
))))
1985 ERR("Failed to allocate input signature memory.\n");
1986 return E_OUTOFMEMORY
;
1989 has_min_precision
= tag
== TAG_OSG1
|| tag
== TAG_PSG1
|| tag
== TAG_ISG1
;
1990 has_stream_index
= tag
== TAG_OSG5
|| has_min_precision
;
1992 for (i
= 0; i
< count
; ++i
)
1996 if (has_stream_index
)
1997 read_dword(&ptr
, &e
[i
].stream_idx
);
1999 e
[i
].stream_idx
= 0;
2000 read_dword(&ptr
, &name_offset
);
2001 if (!(e
[i
].semantic_name
= shader_get_string(data
, data_size
, name_offset
)))
2003 WARN("Invalid name offset %#x (data size %#x).\n", name_offset
, data_size
);
2005 return E_INVALIDARG
;
2007 read_dword(&ptr
, &e
[i
].semantic_idx
);
2008 read_dword(&ptr
, &e
[i
].sysval_semantic
);
2009 read_dword(&ptr
, &e
[i
].component_type
);
2010 read_dword(&ptr
, &e
[i
].register_idx
);
2011 read_dword(&ptr
, &e
[i
].mask
);
2013 if (has_min_precision
)
2014 read_dword(&ptr
, &e
[i
].min_precision
);
2016 e
[i
].min_precision
= 0;
2018 TRACE("Stream: %u, semantic: %s, semantic idx: %u, sysval_semantic %#x, "
2019 "type %u, register idx: %u, use_mask %#x, input_mask %#x, min_precision %u.\n",
2020 e
[i
].stream_idx
, debugstr_a(e
[i
].semantic_name
), e
[i
].semantic_idx
, e
[i
].sysval_semantic
,
2021 e
[i
].component_type
, e
[i
].register_idx
, (e
[i
].mask
>> 8) & 0xff, e
[i
].mask
& 0xff, e
[i
].min_precision
);
2025 s
->element_count
= count
;
/* parse_dxbc() chunk callback used when extracting a shader from DXBC.
 *
 * data, data_size: chunk payload.
 * tag:             chunk tag.
 * context:         a struct shader_handler_context.
 *
 * Signature chunks are parsed into the shader's input, output and patch
 * constant signatures; code chunks set shader->function,
 * shader->functionLength and *ctx->format. Chunks that do not apply to
 * ctx->max_version, and unknown chunks, are skipped with a TRACE().
 *
 * NOTE(review): the case labels selecting each branch are not visible in
 * this listing; the grouping below is inferred from the messages and the
 * fields written - confirm against the full file. */
2030 static HRESULT
shader_dxbc_chunk_handler(const char *data
, DWORD data_size
, DWORD tag
, void *context
)
2032 struct shader_handler_context
*ctx
= context
;
2033 struct wined3d_shader
*shader
= ctx
->shader
;
/* Input signature: ignored below version 4, and only the first one is kept. */
2040 if (ctx
->max_version
< 4)
2042 TRACE("Skipping shader input signature.\n");
2045 if (shader
->input_signature
.elements
)
2047 FIXME("Multiple input signatures.\n");
2050 if (FAILED(hr
= shader_parse_signature(tag
, data
, data_size
, &shader
->input_signature
)))
/* Output signature: same policy as the input signature. */
2057 if (ctx
->max_version
< 4)
2059 TRACE("Skipping shader output signature.\n");
2062 if (shader
->output_signature
.elements
)
2064 FIXME("Multiple output signatures.\n");
2067 if (FAILED(hr
= shader_parse_signature(tag
, data
, data_size
, &shader
->output_signature
)))
/* Patch constant signature: no version check is visible for this one. */
2073 if (shader
->patch_constant_signature
.elements
)
2075 FIXME("Multiple patch constant signatures.\n");
2078 if (FAILED(hr
= shader_parse_signature(tag
, data
, data_size
, &shader
->patch_constant_signature
)))
/* SM4+ code chunk: the shader points directly into the chunk payload. */
2084 if (ctx
->max_version
< 4)
2086 TRACE("Skipping SM4+ shader.\n");
2089 if (shader
->function
)
2090 FIXME("Multiple shader code chunks.\n");
2091 shader
->function
= (const DWORD
*)data
;
2092 shader
->functionLength
= data_size
;
2093 *ctx
->format
= WINED3D_SHADER_BYTE_CODE_FORMAT_SM4
;
/* Feature level 9 code chunk: only used when max_version is below 4. */
2097 if (ctx
->max_version
< 4)
2099 const struct aon9_header
*header
= (const struct aon9_header
*)data
;
2100 unsigned int unknown_dword_count
;
2101 const char *byte_code
;
2103 if (data_size
< sizeof(*header
))
2105 WARN("Invalid Aon9 data size %#x.\n", data_size
);
/* NOTE(review): byte_code and unknown_dword_count are derived from
 * header->byte_code_offset before that offset is checked against
 * data_size, and the subtraction of sizeof(*header) is unsigned, so an
 * offset smaller than the header would wrap - worth validating first. */
2108 byte_code
= data
+ header
->byte_code_offset
;
2109 unknown_dword_count
= (header
->byte_code_offset
- sizeof(*header
)) / sizeof(DWORD
);
2111 if (data_size
- 2 * sizeof(DWORD
) < header
->byte_code_offset
)
2113 WARN("Invalid byte code offset %#x (size %#x).\n", header
->byte_code_offset
, data_size
);
2116 FIXME("Skipping %u unknown DWORDs.\n", unknown_dword_count
);
2118 if (shader
->function
)
2119 FIXME("Multiple shader code chunks.\n");
2120 shader
->function
= (const DWORD
*)byte_code
;
2121 shader
->functionLength
= data_size
- header
->byte_code_offset
;
2122 *ctx
->format
= WINED3D_SHADER_BYTE_CODE_FORMAT_SM1
;
2123 TRACE("Feature level 9 shader version 0%08x, 0%08x.\n",
2124 header
->shader_version
, *shader
->function
);
2128 TRACE("Skipping feature level 9 shader code.\n");
/* Any other chunk is ignored. */
2133 TRACE("Skipping chunk %s.\n", debugstr_an((const char *)&tag
, 4));
/* Extract signatures and shader code from the DXBC blob stored in
 * shader->byte_code.
 *
 * shader:             source of the blob (byte_code / byte_code_size) and
 *                     destination for the parsed results.
 * max_shader_version: forwarded to the chunk handler as ctx.max_version.
 * format:             receives the byte code format of the code chunk.
 *
 * Runs parse_dxbc() with shader_dxbc_chunk_handler(), then checks that a
 * code chunk was found (shader->function) and logs any failure.
 * NOTE(review): the statement executed when shader->function is NULL and
 * the final return are not visible in this listing. */
2140 HRESULT
shader_extract_from_dxbc(struct wined3d_shader
*shader
,
2141 unsigned int max_shader_version
, enum wined3d_shader_byte_code_format
*format
)
2143 struct shader_handler_context ctx
;
2146 ctx
.shader
= shader
;
2147 ctx
.format
= format
;
2148 ctx
.max_version
= max_shader_version
;
2150 hr
= parse_dxbc(shader
->byte_code
, shader
->byte_code_size
, shader_dxbc_chunk_handler
, &ctx
);
2151 if (!shader
->function
)
2155 WARN("Failed to parse DXBC, hr %#x.\n", hr
);
/* parse_dxbc() chunk callback that extracts only the input signature.
 *
 * ctx is the struct wined3d_shader_signature to fill. Chunks whose tag is
 * not TAG_ISGN take the early branch; a repeated signature is reported
 * with FIXME(); otherwise the chunk is handed to shader_parse_signature().
 * NOTE(review): the statements taken on the two early branches are not
 * visible in this listing. */
2160 static HRESULT
shader_isgn_chunk_handler(const char *data
, DWORD data_size
, DWORD tag
, void *ctx
)
2162 struct wined3d_shader_signature
*is
= ctx
;
2164 if (tag
!= TAG_ISGN
)
2169 FIXME("Multiple shader signatures.\n");
2173 return shader_parse_signature(tag
, data
, data_size
, is
);
/* Extract the input signature from a DXBC blob.
 *
 * signature: zeroed first, then filled by shader_isgn_chunk_handler().
 * code, code_size: the DXBC blob.
 *
 * Returns the result of parse_dxbc(). */
2176 HRESULT CDECL
wined3d_extract_shader_input_signature_from_dxbc(struct wined3d_shader_signature
*signature
,
2177 const void *code
, SIZE_T code_size
)
2179 memset(signature
, 0, sizeof(*signature
));
2180 return parse_dxbc(code
, code_size
, shader_isgn_chunk_handler
, signature
);