2 * Copyright 2009 Henri Verbeet for CodeWeavers
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
9 * This library is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with this library; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
20 #include "wine/port.h"
22 #include "wined3d_private.h"
24 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader
);
25 WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode
);
/* Opcode token: set when an additional instruction modifier token follows
 * the opcode token. */
#define WINED3D_SM4_INSTRUCTION_MODIFIER        (0x1u << 31)

/* Opcode token: instruction length field. */
#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0x1fu << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

/* Opcode token of a resource declaration: resource type field. */
#define WINED3D_SM4_RESOURCE_TYPE_SHIFT         11
#define WINED3D_SM4_RESOURCE_TYPE_MASK          (0xfu << WINED3D_SM4_RESOURCE_TYPE_SHIFT)

/* Opcode token of an input primitive / output topology declaration:
 * primitive type field. */
#define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT        11
#define WINED3D_SM4_PRIMITIVE_TYPE_MASK         (0x7u << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)

/* Opcode token of a constant buffer declaration: index type flag. */
#define WINED3D_SM4_INDEX_TYPE_SHIFT            11
#define WINED3D_SM4_INDEX_TYPE_MASK             (0x1u << WINED3D_SM4_INDEX_TYPE_SHIFT)

/* Opcode token: the opcode itself. */
#define WINED3D_SM4_OPCODE_MASK                 0xff

/* Register token: set when a register modifier token follows. */
#define WINED3D_SM4_REGISTER_MODIFIER           (0x1u << 31)

/* Register token: addressing mode of the second register index. */
#define WINED3D_SM4_ADDRESSING_SHIFT1           25
#define WINED3D_SM4_ADDRESSING_MASK1            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT1)

/* Register token: addressing mode of the first register index. */
#define WINED3D_SM4_ADDRESSING_SHIFT0           22
#define WINED3D_SM4_ADDRESSING_MASK0            (0x3u << WINED3D_SM4_ADDRESSING_SHIFT0)

/* Register token: register order field. */
#define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
#define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3u << WINED3D_SM4_REGISTER_ORDER_SHIFT)

/* Register token: register type field (enum wined3d_sm4_register_type). */
#define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
#define WINED3D_SM4_REGISTER_TYPE_MASK          (0xfu << WINED3D_SM4_REGISTER_TYPE_SHIFT)

/* Source register token: swizzle type field (enum wined3d_sm4_swizzle_type). */
#define WINED3D_SM4_SWIZZLE_TYPE_SHIFT          2
#define WINED3D_SM4_SWIZZLE_TYPE_MASK           (0x3u << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)

/* Immediate constant register token: constant type field
 * (enum wined3d_sm4_immconst_type). */
#define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
#define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3u << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

/* Destination register token: write mask field. */
#define WINED3D_SM4_WRITEMASK_SHIFT             4
#define WINED3D_SM4_WRITEMASK_MASK              (0xfu << WINED3D_SM4_WRITEMASK_SHIFT)

/* Source register token: swizzle field. */
#define WINED3D_SM4_SWIZZLE_SHIFT               4
#define WINED3D_SM4_SWIZZLE_MASK                (0xffu << WINED3D_SM4_SWIZZLE_SHIFT)

/* Version token: major and minor shader version. */
#define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)

/* Flags found in the addressing mode fields of a register token. */
#define WINED3D_SM4_ADDRESSING_RELATIVE         0x2
#define WINED3D_SM4_ADDRESSING_OFFSET           0x1
/* SM4 opcodes, as found in the opcode token after masking with
 * WINED3D_SM4_OPCODE_MASK. */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD                  = 0x00,
    WINED3D_SM4_OP_AND                  = 0x01,
    WINED3D_SM4_OP_BREAK                = 0x02,
    WINED3D_SM4_OP_BREAKC               = 0x03,
    WINED3D_SM4_OP_CUT                  = 0x09,
    WINED3D_SM4_OP_DERIV_RTX            = 0x0b,
    WINED3D_SM4_OP_DERIV_RTY            = 0x0c,
    WINED3D_SM4_OP_DISCARD              = 0x0d,
    WINED3D_SM4_OP_DIV                  = 0x0e,
    WINED3D_SM4_OP_DP2                  = 0x0f,
    WINED3D_SM4_OP_DP3                  = 0x10,
    WINED3D_SM4_OP_DP4                  = 0x11,
    WINED3D_SM4_OP_EMIT                 = 0x13,
    WINED3D_SM4_OP_ENDIF                = 0x15,
    WINED3D_SM4_OP_ENDLOOP              = 0x16,
    WINED3D_SM4_OP_EQ                   = 0x18,
    WINED3D_SM4_OP_EXP                  = 0x19,
    WINED3D_SM4_OP_FRC                  = 0x1a,
    WINED3D_SM4_OP_FTOI                 = 0x1b,
    WINED3D_SM4_OP_GE                   = 0x1d,
    WINED3D_SM4_OP_IADD                 = 0x1e,
    WINED3D_SM4_OP_IF                   = 0x1f,
    WINED3D_SM4_OP_IEQ                  = 0x20,
    WINED3D_SM4_OP_IGE                  = 0x21,
    WINED3D_SM4_OP_IMUL                 = 0x26,
    WINED3D_SM4_OP_ISHL                 = 0x29,
    WINED3D_SM4_OP_ITOF                 = 0x2b,
    WINED3D_SM4_OP_LD                   = 0x2d,
    WINED3D_SM4_OP_LOG                  = 0x2f,
    WINED3D_SM4_OP_LOOP                 = 0x30,
    WINED3D_SM4_OP_LT                   = 0x31,
    WINED3D_SM4_OP_MAD                  = 0x32,
    WINED3D_SM4_OP_MIN                  = 0x33,
    WINED3D_SM4_OP_MAX                  = 0x34,
    WINED3D_SM4_OP_MOV                  = 0x36,
    WINED3D_SM4_OP_MOVC                 = 0x37,
    WINED3D_SM4_OP_MUL                  = 0x38,
    WINED3D_SM4_OP_NE                   = 0x39,
    WINED3D_SM4_OP_OR                   = 0x3c,
    WINED3D_SM4_OP_RET                  = 0x3e,
    WINED3D_SM4_OP_ROUND_NI             = 0x41,
    WINED3D_SM4_OP_RSQ                  = 0x44,
    WINED3D_SM4_OP_SAMPLE               = 0x45,
    WINED3D_SM4_OP_SAMPLE_LOD           = 0x48,
    WINED3D_SM4_OP_SAMPLE_GRAD          = 0x49,
    WINED3D_SM4_OP_SQRT                 = 0x4b,
    WINED3D_SM4_OP_SINCOS               = 0x4d,
    WINED3D_SM4_OP_UDIV                 = 0x4e,
    WINED3D_SM4_OP_UGE                  = 0x50,
    WINED3D_SM4_OP_USHR                 = 0x55,
    WINED3D_SM4_OP_UTOF                 = 0x56,
    WINED3D_SM4_OP_XOR                  = 0x57,
    WINED3D_SM4_OP_DCL_RESOURCE         = 0x58,
    WINED3D_SM4_OP_DCL_CONSTANT_BUFFER  = 0x59,
    WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY  = 0x5c,
    WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE  = 0x5d,
    WINED3D_SM4_OP_DCL_VERTICES_OUT     = 0x5e,
};
/* Register types, as found in the register type field of a register token.
 * The values are used as indices into register_type_table. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP         = 0x0,
    WINED3D_SM4_RT_INPUT        = 0x1,
    WINED3D_SM4_RT_OUTPUT       = 0x2,
    WINED3D_SM4_RT_IMMCONST     = 0x4,
    WINED3D_SM4_RT_SAMPLER      = 0x6,
    WINED3D_SM4_RT_RESOURCE     = 0x7,
    WINED3D_SM4_RT_CONSTBUFFER  = 0x8,
    WINED3D_SM4_RT_PRIMID       = 0xb,
    WINED3D_SM4_RT_NULL         = 0xd,
};
/* Output primitive types, as found in the primitive type field of an output
 * topology declaration. Used as indices into output_primitive_type_table. */
enum wined3d_sm4_output_primitive_type
{
    WINED3D_SM4_OUTPUT_PT_POINTLIST     = 0x1,
    WINED3D_SM4_OUTPUT_PT_LINELIST      = 0x3,
    WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
};
/* Input primitive types, as found in the primitive type field of an input
 * primitive declaration. Used as indices into input_primitive_type_table. */
enum wined3d_sm4_input_primitive_type
{
    WINED3D_SM4_INPUT_PT_POINT          = 0x1,
    WINED3D_SM4_INPUT_PT_LINE           = 0x2,
    WINED3D_SM4_INPUT_PT_TRIANGLE       = 0x3,
    WINED3D_SM4_INPUT_PT_LINEADJ        = 0x6,
    WINED3D_SM4_INPUT_PT_TRIANGLEADJ    = 0x7,
};
/* Swizzle types, as found in the swizzle type field of a source register
 * token. */
enum wined3d_sm4_swizzle_type
{
    WINED3D_SM4_SWIZZLE_VEC4    = 0x1,
    WINED3D_SM4_SWIZZLE_SCALAR  = 0x2,
};
/* Immediate constant types, as found in the immediate constant type field of
 * a register token whose register type is WINED3D_SM4_RT_IMMCONST. */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_SCALAR = 0x1,
    WINED3D_SM4_IMMCONST_VEC4   = 0x2,
};
/* Resource types, as found in the resource type field of a resource
 * declaration. Used as indices into resource_type_table. */
enum wined3d_sm4_resource_type
{
    WINED3D_SM4_RESOURCE_BUFFER             = 0x1,
    WINED3D_SM4_RESOURCE_TEXTURE_1D         = 0x2,
    WINED3D_SM4_RESOURCE_TEXTURE_2D         = 0x3,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMS       = 0x4,
    WINED3D_SM4_RESOURCE_TEXTURE_3D         = 0x5,
    WINED3D_SM4_RESOURCE_TEXTURE_CUBE       = 0x6,
    WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY    = 0x7,
    WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY    = 0x8,
    WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY  = 0x9,
};
/* Resource data types, as found in the low four bits of the component type
 * token of a resource declaration. Used as indices into data_type_table. */
enum wined3d_sm4_data_type
{
    WINED3D_SM4_DATA_UNORM  = 0x1,
    WINED3D_SM4_DATA_SNORM  = 0x2,
    WINED3D_SM4_DATA_INT    = 0x3,
    WINED3D_SM4_DATA_UINT   = 0x4,
    WINED3D_SM4_DATA_FLOAT  = 0x5,
};
199 struct wined3d_shader_src_param_entry
202 struct wined3d_shader_src_param param
;
205 struct wined3d_sm4_data
207 struct wined3d_shader_version shader_version
;
212 enum wined3d_shader_register_type register_type
;
214 } output_map
[MAX_REG_OUTPUT
];
216 struct wined3d_shader_src_param src_param
[5];
217 struct wined3d_shader_dst_param dst_param
[2];
218 struct list src_free
;
222 struct wined3d_sm4_opcode_info
224 enum wined3d_sm4_opcode opcode
;
225 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx
;
226 const char *dst_info
;
227 const char *src_info
;
232 enum wined3d_sysval_semantic sysval
;
233 enum wined3d_shader_register_type register_type
;
238 * F -> WINED3D_DATA_FLOAT
239 * I -> WINED3D_DATA_INT
240 * R -> WINED3D_DATA_RESOURCE
241 * S -> WINED3D_DATA_SAMPLER
242 * U -> WINED3D_DATA_UINT
244 static const struct wined3d_sm4_opcode_info opcode_table
[] =
246 {WINED3D_SM4_OP_ADD
, WINED3DSIH_ADD
, "F", "FF"},
247 {WINED3D_SM4_OP_AND
, WINED3DSIH_AND
, "U", "UU"},
248 {WINED3D_SM4_OP_BREAK
, WINED3DSIH_BREAK
, "", ""},
249 {WINED3D_SM4_OP_BREAKC
, WINED3DSIH_BREAKP
, "", "U"},
250 {WINED3D_SM4_OP_CUT
, WINED3DSIH_CUT
, "", ""},
251 {WINED3D_SM4_OP_DERIV_RTX
, WINED3DSIH_DSX
, "F", "F"},
252 {WINED3D_SM4_OP_DERIV_RTY
, WINED3DSIH_DSY
, "F", "F"},
253 {WINED3D_SM4_OP_DISCARD
, WINED3DSIH_TEXKILL
, "", "U"},
254 {WINED3D_SM4_OP_DIV
, WINED3DSIH_DIV
, "F", "FF"},
255 {WINED3D_SM4_OP_DP2
, WINED3DSIH_DP2
, "F", "FF"},
256 {WINED3D_SM4_OP_DP3
, WINED3DSIH_DP3
, "F", "FF"},
257 {WINED3D_SM4_OP_DP4
, WINED3DSIH_DP4
, "F", "FF"},
258 {WINED3D_SM4_OP_EMIT
, WINED3DSIH_EMIT
, "", ""},
259 {WINED3D_SM4_OP_ENDIF
, WINED3DSIH_ENDIF
, "", ""},
260 {WINED3D_SM4_OP_ENDLOOP
, WINED3DSIH_ENDLOOP
, "", ""},
261 {WINED3D_SM4_OP_EQ
, WINED3DSIH_EQ
, "U", "FF"},
262 {WINED3D_SM4_OP_EXP
, WINED3DSIH_EXP
, "F", "F"},
263 {WINED3D_SM4_OP_FRC
, WINED3DSIH_FRC
, "F", "F"},
264 {WINED3D_SM4_OP_FTOI
, WINED3DSIH_FTOI
, "I", "F"},
265 {WINED3D_SM4_OP_GE
, WINED3DSIH_GE
, "U", "FF"},
266 {WINED3D_SM4_OP_IADD
, WINED3DSIH_IADD
, "I", "II"},
267 {WINED3D_SM4_OP_IF
, WINED3DSIH_IF
, "", "U"},
268 {WINED3D_SM4_OP_IEQ
, WINED3DSIH_IEQ
, "U", "II"},
269 {WINED3D_SM4_OP_IGE
, WINED3DSIH_IGE
, "U", "II"},
270 {WINED3D_SM4_OP_IMUL
, WINED3DSIH_IMUL
, "II", "II"},
271 {WINED3D_SM4_OP_ISHL
, WINED3DSIH_ISHL
, "I", "II"},
272 {WINED3D_SM4_OP_ITOF
, WINED3DSIH_ITOF
, "F", "I"},
273 {WINED3D_SM4_OP_LD
, WINED3DSIH_LD
, "U", "FR"},
274 {WINED3D_SM4_OP_LOG
, WINED3DSIH_LOG
, "F", "F"},
275 {WINED3D_SM4_OP_LOOP
, WINED3DSIH_LOOP
, "", ""},
276 {WINED3D_SM4_OP_LT
, WINED3DSIH_LT
, "U", "FF"},
277 {WINED3D_SM4_OP_MAD
, WINED3DSIH_MAD
, "F", "FFF"},
278 {WINED3D_SM4_OP_MIN
, WINED3DSIH_MIN
, "F", "FF"},
279 {WINED3D_SM4_OP_MAX
, WINED3DSIH_MAX
, "F", "FF"},
280 {WINED3D_SM4_OP_MOV
, WINED3DSIH_MOV
, "F", "F"},
281 {WINED3D_SM4_OP_MOVC
, WINED3DSIH_MOVC
, "F", "UFF"},
282 {WINED3D_SM4_OP_MUL
, WINED3DSIH_MUL
, "F", "FF"},
283 {WINED3D_SM4_OP_NE
, WINED3DSIH_NE
, "U", "FF"},
284 {WINED3D_SM4_OP_OR
, WINED3DSIH_OR
, "U", "UU"},
285 {WINED3D_SM4_OP_RET
, WINED3DSIH_RET
, "", ""},
286 {WINED3D_SM4_OP_ROUND_NI
, WINED3DSIH_ROUND_NI
, "F", "F"},
287 {WINED3D_SM4_OP_RSQ
, WINED3DSIH_RSQ
, "F", "F"},
288 {WINED3D_SM4_OP_SAMPLE
, WINED3DSIH_SAMPLE
, "U", "FRS"},
289 {WINED3D_SM4_OP_SAMPLE_LOD
, WINED3DSIH_SAMPLE_LOD
, "U", "FRSF"},
290 {WINED3D_SM4_OP_SAMPLE_GRAD
, WINED3DSIH_SAMPLE_GRAD
, "U", "FRSFF"},
291 {WINED3D_SM4_OP_SQRT
, WINED3DSIH_SQRT
, "F", "F"},
292 {WINED3D_SM4_OP_SINCOS
, WINED3DSIH_SINCOS
, "FF", "F"},
293 {WINED3D_SM4_OP_UDIV
, WINED3DSIH_UDIV
, "UU", "UU"},
294 {WINED3D_SM4_OP_UGE
, WINED3DSIH_UGE
, "U", "UU"},
295 {WINED3D_SM4_OP_USHR
, WINED3DSIH_USHR
, "U", "UU"},
296 {WINED3D_SM4_OP_UTOF
, WINED3DSIH_UTOF
, "F", "U"},
297 {WINED3D_SM4_OP_XOR
, WINED3DSIH_XOR
, "U", "UU"},
298 {WINED3D_SM4_OP_DCL_RESOURCE
, WINED3DSIH_DCL
, "R", ""},
299 {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER
, WINED3DSIH_DCL_CONSTANT_BUFFER
, "", ""},
300 {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY
, WINED3DSIH_DCL_OUTPUT_TOPOLOGY
, "", ""},
301 {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE
, WINED3DSIH_DCL_INPUT_PRIMITIVE
, "", ""},
302 {WINED3D_SM4_OP_DCL_VERTICES_OUT
, WINED3DSIH_DCL_VERTICES_OUT
, "", ""},
305 static const enum wined3d_shader_register_type register_type_table
[] =
307 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP
,
308 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT
,
309 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT
,
311 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST
,
313 /* WINED3D_SM4_RT_SAMPLER */ WINED3DSPR_SAMPLER
,
314 /* WINED3D_SM4_RT_RESOURCE */ WINED3DSPR_RESOURCE
,
315 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER
,
318 /* WINED3D_SM4_RT_PRIMID */ WINED3DSPR_PRIMID
,
320 /* WINED3D_SM4_RT_NULL */ WINED3DSPR_NULL
,
323 static const enum wined3d_primitive_type output_primitive_type_table
[] =
325 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
326 /* WINED3D_SM4_OUTPUT_PT_POINTLIST */ WINED3D_PT_POINTLIST
,
327 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
328 /* WINED3D_SM4_OUTPUT_PT_LINELIST */ WINED3D_PT_LINELIST
,
329 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
330 /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */ WINED3D_PT_TRIANGLESTRIP
,
333 static const enum wined3d_primitive_type input_primitive_type_table
[] =
335 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
336 /* WINED3D_SM4_INPUT_PT_POINT */ WINED3D_PT_POINTLIST
,
337 /* WINED3D_SM4_INPUT_PT_LINE */ WINED3D_PT_LINELIST
,
338 /* WINED3D_SM4_INPUT_PT_TRIANGLE */ WINED3D_PT_TRIANGLELIST
,
339 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
340 /* UNKNOWN */ WINED3D_PT_UNDEFINED
,
341 /* WINED3D_SM4_INPUT_PT_LINEADJ */ WINED3D_PT_LINELIST_ADJ
,
342 /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */ WINED3D_PT_TRIANGLELIST_ADJ
,
345 static const struct sysval_map sysval_map
[] =
347 {WINED3D_SV_DEPTH
, WINED3DSPR_DEPTHOUT
, 0},
348 {WINED3D_SV_TARGET0
, WINED3DSPR_COLOROUT
, 0},
349 {WINED3D_SV_TARGET1
, WINED3DSPR_COLOROUT
, 1},
350 {WINED3D_SV_TARGET2
, WINED3DSPR_COLOROUT
, 2},
351 {WINED3D_SV_TARGET3
, WINED3DSPR_COLOROUT
, 3},
352 {WINED3D_SV_TARGET4
, WINED3DSPR_COLOROUT
, 4},
353 {WINED3D_SV_TARGET5
, WINED3DSPR_COLOROUT
, 5},
354 {WINED3D_SV_TARGET6
, WINED3DSPR_COLOROUT
, 6},
355 {WINED3D_SV_TARGET7
, WINED3DSPR_COLOROUT
, 7},
358 static const enum wined3d_shader_resource_type resource_type_table
[] =
360 /* 0 */ WINED3D_SHADER_RESOURCE_NONE
,
361 /* WINED3D_SM4_RESOURCE_BUFFER */ WINED3D_SHADER_RESOURCE_BUFFER
,
362 /* WINED3D_SM4_RESOURCE_TEXTURE_1D */ WINED3D_SHADER_RESOURCE_TEXTURE_1D
,
363 /* WINED3D_SM4_RESOURCE_TEXTURE_2D */ WINED3D_SHADER_RESOURCE_TEXTURE_2D
,
364 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMS */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMS
,
365 /* WINED3D_SM4_RESOURCE_TEXTURE_3D */ WINED3D_SHADER_RESOURCE_TEXTURE_3D
,
366 /* WINED3D_SM4_RESOURCE_TEXTURE_CUBE */ WINED3D_SHADER_RESOURCE_TEXTURE_CUBE
,
367 /* WINED3D_SM4_RESOURCE_TEXTURE_1DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_1DARRAY
,
368 /* WINED3D_SM4_RESOURCE_TEXTURE_2DARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DARRAY
,
369 /* WINED3D_SM4_RESOURCE_TEXTURE_2DMSARRAY */ WINED3D_SHADER_RESOURCE_TEXTURE_2DMSARRAY
,
372 static const enum wined3d_data_type data_type_table
[] =
374 /* 0 */ WINED3D_DATA_FLOAT
,
375 /* WINED3D_SM4_DATA_UNORM */ WINED3D_DATA_UNORM
,
376 /* WINED3D_SM4_DATA_SNORM */ WINED3D_DATA_SNORM
,
377 /* WINED3D_SM4_DATA_INT */ WINED3D_DATA_INT
,
378 /* WINED3D_SM4_DATA_UINT */ WINED3D_DATA_UINT
,
379 /* WINED3D_SM4_DATA_FLOAT */ WINED3D_DATA_FLOAT
,
382 static BOOL
shader_sm4_read_src_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
,
383 enum wined3d_data_type data_type
, struct wined3d_shader_src_param
*src_param
);
385 static const struct wined3d_sm4_opcode_info
*get_opcode_info(enum wined3d_sm4_opcode opcode
)
389 for (i
= 0; i
< sizeof(opcode_table
) / sizeof(*opcode_table
); ++i
)
391 if (opcode
== opcode_table
[i
].opcode
) return &opcode_table
[i
];
397 static void map_register(const struct wined3d_sm4_data
*priv
, struct wined3d_shader_register
*reg
)
399 switch (priv
->shader_version
.type
)
401 case WINED3D_SHADER_TYPE_PIXEL
:
402 if (reg
->type
== WINED3DSPR_OUTPUT
)
404 unsigned int reg_idx
= reg
->idx
[0].offset
;
406 if (reg_idx
>= ARRAY_SIZE(priv
->output_map
))
408 ERR("Invalid output index %u.\n", reg_idx
);
412 reg
->type
= priv
->output_map
[reg_idx
].register_type
;
413 reg
->idx
[0].offset
= priv
->output_map
[reg_idx
].register_idx
;
422 static enum wined3d_data_type
map_data_type(char t
)
427 return WINED3D_DATA_FLOAT
;
429 return WINED3D_DATA_INT
;
431 return WINED3D_DATA_RESOURCE
;
433 return WINED3D_DATA_SAMPLER
;
435 return WINED3D_DATA_UINT
;
437 ERR("Invalid data type '%c'.\n", t
);
438 return WINED3D_DATA_FLOAT
;
442 static void *shader_sm4_init(const DWORD
*byte_code
, const struct wined3d_shader_signature
*output_signature
)
444 struct wined3d_sm4_data
*priv
;
447 if (!(priv
= HeapAlloc(GetProcessHeap(), 0, sizeof(*priv
))))
449 ERR("Failed to allocate private data\n");
453 memset(priv
->output_map
, 0xff, sizeof(priv
->output_map
));
454 for (i
= 0; i
< output_signature
->element_count
; ++i
)
456 struct wined3d_shader_signature_element
*e
= &output_signature
->elements
[i
];
458 if (e
->register_idx
>= ARRAY_SIZE(priv
->output_map
))
460 WARN("Invalid output index %u.\n", e
->register_idx
);
464 for (j
= 0; j
< ARRAY_SIZE(sysval_map
); ++j
)
466 if (e
->sysval_semantic
== sysval_map
[j
].sysval
)
468 priv
->output_map
[e
->register_idx
].register_type
= sysval_map
[j
].register_type
;
469 priv
->output_map
[e
->register_idx
].register_idx
= sysval_map
[j
].register_idx
;
475 list_init(&priv
->src_free
);
476 list_init(&priv
->src
);
481 static void shader_sm4_free(void *data
)
483 struct wined3d_shader_src_param_entry
*e1
, *e2
;
484 struct wined3d_sm4_data
*priv
= data
;
486 list_move_head(&priv
->src_free
, &priv
->src
);
487 LIST_FOR_EACH_ENTRY_SAFE(e1
, e2
, &priv
->src_free
, struct wined3d_shader_src_param_entry
, entry
)
489 HeapFree(GetProcessHeap(), 0, e1
);
491 HeapFree(GetProcessHeap(), 0, priv
);
494 static struct wined3d_shader_src_param
*get_src_param(struct wined3d_sm4_data
*priv
)
496 struct wined3d_shader_src_param_entry
*e
;
499 if (!list_empty(&priv
->src_free
))
501 elem
= list_head(&priv
->src_free
);
506 if (!(e
= HeapAlloc(GetProcessHeap(), 0, sizeof(*e
))))
511 list_add_tail(&priv
->src
, elem
);
512 e
= LIST_ENTRY(elem
, struct wined3d_shader_src_param_entry
, entry
);
516 static void shader_sm4_read_header(void *data
, const DWORD
**ptr
, struct wined3d_shader_version
*shader_version
)
518 struct wined3d_sm4_data
*priv
= data
;
523 version_token
= *(*ptr
)++;
524 TRACE("version: 0x%08x\n", version_token
);
526 TRACE("token count: %u\n", **ptr
);
527 priv
->end
+= *(*ptr
)++;
529 switch (version_token
>> 16)
532 priv
->shader_version
.type
= WINED3D_SHADER_TYPE_PIXEL
;
536 priv
->shader_version
.type
= WINED3D_SHADER_TYPE_VERTEX
;
540 priv
->shader_version
.type
= WINED3D_SHADER_TYPE_GEOMETRY
;
544 FIXME("Unrecognized shader type %#x\n", version_token
>> 16);
546 priv
->shader_version
.major
= WINED3D_SM4_VERSION_MAJOR(version_token
);
547 priv
->shader_version
.minor
= WINED3D_SM4_VERSION_MINOR(version_token
);
549 *shader_version
= priv
->shader_version
;
552 static BOOL
shader_sm4_read_reg_idx(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
,
553 DWORD addressing
, struct wined3d_shader_register_index
*reg_idx
)
555 if (addressing
& WINED3D_SM4_ADDRESSING_RELATIVE
)
557 struct wined3d_shader_src_param
*rel_addr
= get_src_param(priv
);
559 if (!(reg_idx
->rel_addr
= rel_addr
))
561 ERR("Failed to get src param for relative addressing.\n");
565 if (addressing
& WINED3D_SM4_ADDRESSING_OFFSET
)
566 reg_idx
->offset
= *(*ptr
)++;
569 shader_sm4_read_src_param(priv
, ptr
, WINED3D_DATA_INT
, rel_addr
);
573 reg_idx
->rel_addr
= NULL
;
574 reg_idx
->offset
= *(*ptr
)++;
580 static BOOL
shader_sm4_read_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
,
581 enum wined3d_data_type data_type
, struct wined3d_shader_register
*param
,
582 enum wined3d_shader_src_modifier
*modifier
)
584 enum wined3d_sm4_register_type register_type
;
585 DWORD token
= *(*ptr
)++;
588 register_type
= (token
& WINED3D_SM4_REGISTER_TYPE_MASK
) >> WINED3D_SM4_REGISTER_TYPE_SHIFT
;
589 if (register_type
>= sizeof(register_type_table
) / sizeof(*register_type_table
))
591 FIXME("Unhandled register type %#x.\n", register_type
);
592 param
->type
= WINED3DSPR_TEMP
;
596 param
->type
= register_type_table
[register_type
];
598 param
->data_type
= data_type
;
600 if (token
& WINED3D_SM4_REGISTER_MODIFIER
)
604 /* FIXME: This will probably break down at some point. The SM4
605 * modifiers look like flags, while wined3d currently has an enum
606 * with possible combinations, e.g. WINED3DSPSM_ABSNEG. */
610 *modifier
= WINED3DSPSM_NEG
;
614 *modifier
= WINED3DSPSM_ABS
;
618 FIXME("Skipping modifier 0x%08x.\n", m
);
619 *modifier
= WINED3DSPSM_NONE
;
625 *modifier
= WINED3DSPSM_NONE
;
628 order
= (token
& WINED3D_SM4_REGISTER_ORDER_MASK
) >> WINED3D_SM4_REGISTER_ORDER_SHIFT
;
631 param
->idx
[0].offset
= ~0U;
634 DWORD addressing
= (token
& WINED3D_SM4_ADDRESSING_MASK0
) >> WINED3D_SM4_ADDRESSING_SHIFT0
;
635 if (!(shader_sm4_read_reg_idx(priv
, ptr
, addressing
, ¶m
->idx
[0])))
637 ERR("Failed to read register index.\n");
643 param
->idx
[1].offset
= ~0U;
646 DWORD addressing
= (token
& WINED3D_SM4_ADDRESSING_MASK1
) >> WINED3D_SM4_ADDRESSING_SHIFT1
;
647 if (!(shader_sm4_read_reg_idx(priv
, ptr
, addressing
, ¶m
->idx
[1])))
649 ERR("Failed to read register index.\n");
655 FIXME("Unhandled order %u.\n", order
);
657 if (register_type
== WINED3D_SM4_RT_IMMCONST
)
659 enum wined3d_sm4_immconst_type immconst_type
=
660 (token
& WINED3D_SM4_IMMCONST_TYPE_MASK
) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT
;
662 switch (immconst_type
)
664 case WINED3D_SM4_IMMCONST_SCALAR
:
665 param
->immconst_type
= WINED3D_IMMCONST_SCALAR
;
666 memcpy(param
->immconst_data
, *ptr
, 1 * sizeof(DWORD
));
670 case WINED3D_SM4_IMMCONST_VEC4
:
671 param
->immconst_type
= WINED3D_IMMCONST_VEC4
;
672 memcpy(param
->immconst_data
, *ptr
, 4 * sizeof(DWORD
));
677 FIXME("Unhandled immediate constant type %#x.\n", immconst_type
);
682 map_register(priv
, param
);
687 static BOOL
shader_sm4_read_src_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
,
688 enum wined3d_data_type data_type
, struct wined3d_shader_src_param
*src_param
)
692 if (!shader_sm4_read_param(priv
, ptr
, data_type
, &src_param
->reg
, &src_param
->modifiers
))
694 ERR("Failed to read parameter.\n");
698 if (src_param
->reg
.type
== WINED3DSPR_IMMCONST
)
700 src_param
->swizzle
= WINED3DSP_NOSWIZZLE
;
704 enum wined3d_sm4_swizzle_type swizzle_type
=
705 (token
& WINED3D_SM4_SWIZZLE_TYPE_MASK
) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT
;
707 switch (swizzle_type
)
709 case WINED3D_SM4_SWIZZLE_SCALAR
:
710 src_param
->swizzle
= (token
& WINED3D_SM4_SWIZZLE_MASK
) >> WINED3D_SM4_SWIZZLE_SHIFT
;
711 src_param
->swizzle
= (src_param
->swizzle
& 0x3) * 0x55;
714 case WINED3D_SM4_SWIZZLE_VEC4
:
715 src_param
->swizzle
= (token
& WINED3D_SM4_SWIZZLE_MASK
) >> WINED3D_SM4_SWIZZLE_SHIFT
;
719 FIXME("Unhandled swizzle type %#x.\n", swizzle_type
);
727 static BOOL
shader_sm4_read_dst_param(struct wined3d_sm4_data
*priv
, const DWORD
**ptr
,
728 enum wined3d_data_type data_type
, struct wined3d_shader_dst_param
*dst_param
)
730 enum wined3d_shader_src_modifier modifier
;
733 if (!shader_sm4_read_param(priv
, ptr
, data_type
, &dst_param
->reg
, &modifier
))
735 ERR("Failed to read parameter.\n");
739 if (modifier
!= WINED3DSPSM_NONE
)
741 ERR("Invalid source modifier %#x on destination register.\n", modifier
);
745 dst_param
->write_mask
= (token
& WINED3D_SM4_WRITEMASK_MASK
) >> WINED3D_SM4_WRITEMASK_SHIFT
;
746 dst_param
->modifiers
= 0;
747 dst_param
->shift
= 0;
752 static void shader_sm4_read_instruction(void *data
, const DWORD
**ptr
, struct wined3d_shader_instruction
*ins
)
754 const struct wined3d_sm4_opcode_info
*opcode_info
;
755 struct wined3d_sm4_data
*priv
= data
;
756 DWORD opcode_token
, opcode
;
760 list_move_head(&priv
->src_free
, &priv
->src
);
762 opcode_token
= *(*ptr
)++;
763 opcode
= opcode_token
& WINED3D_SM4_OPCODE_MASK
;
764 len
= ((opcode_token
& WINED3D_SM4_INSTRUCTION_LENGTH_MASK
) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT
) - 1;
766 if (TRACE_ON(d3d_bytecode
))
768 TRACE_(d3d_bytecode
)("[ %08x ", opcode_token
);
769 for (i
= 0; i
< len
; ++i
)
771 TRACE_(d3d_bytecode
)("%08x ", (*ptr
)[i
]);
773 TRACE_(d3d_bytecode
)("]\n");
776 if (!(opcode_info
= get_opcode_info(opcode
)))
778 FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode
, opcode_token
);
779 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
784 ins
->handler_idx
= opcode_info
->handler_idx
;
787 ins
->predicate
= NULL
;
788 ins
->dst_count
= strlen(opcode_info
->dst_info
);
789 ins
->dst
= priv
->dst_param
;
790 ins
->src_count
= strlen(opcode_info
->src_info
);
791 ins
->src
= priv
->src_param
;
796 if (opcode_token
& WINED3D_SM4_INSTRUCTION_MODIFIER
)
798 DWORD modifier
= *p
++;
799 FIXME("Skipping modifier 0x%08x.\n", modifier
);
802 if (opcode
== WINED3D_SM4_OP_DCL_RESOURCE
)
804 enum wined3d_sm4_resource_type resource_type
;
805 enum wined3d_sm4_data_type data_type
;
808 resource_type
= (opcode_token
& WINED3D_SM4_RESOURCE_TYPE_MASK
) >> WINED3D_SM4_RESOURCE_TYPE_SHIFT
;
809 if (!resource_type
|| (resource_type
>= ARRAY_SIZE(resource_type_table
)))
811 FIXME("Unhandled resource type %#x.\n", resource_type
);
812 ins
->declaration
.semantic
.resource_type
= WINED3D_SHADER_RESOURCE_NONE
;
816 ins
->declaration
.semantic
.resource_type
= resource_type_table
[resource_type
];
818 shader_sm4_read_dst_param(priv
, &p
, WINED3D_DATA_RESOURCE
, &ins
->declaration
.semantic
.reg
);
821 if ((components
& 0xfff0) != (components
& 0xf) * 0x1110)
822 FIXME("Components (%#x) have different data types.\n", components
);
823 data_type
= components
& 0xf;
825 if (!data_type
|| (data_type
>= ARRAY_SIZE(data_type_table
)))
827 FIXME("Unhandled data type %#x.\n", data_type
);
828 ins
->declaration
.semantic
.resource_data_type
= WINED3D_DATA_FLOAT
;
832 ins
->declaration
.semantic
.resource_data_type
= data_type_table
[data_type
];
835 else if (opcode
== WINED3D_SM4_OP_DCL_CONSTANT_BUFFER
)
837 shader_sm4_read_src_param(priv
, &p
, WINED3D_DATA_FLOAT
, &ins
->declaration
.src
);
838 if (opcode_token
& WINED3D_SM4_INDEX_TYPE_MASK
)
839 ins
->flags
|= WINED3DSI_INDEXED_DYNAMIC
;
841 else if (opcode
== WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY
)
843 enum wined3d_sm4_output_primitive_type primitive_type
;
845 primitive_type
= (opcode_token
& WINED3D_SM4_PRIMITIVE_TYPE_MASK
) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT
;
846 if (primitive_type
>= sizeof(output_primitive_type_table
) / sizeof(*output_primitive_type_table
))
848 FIXME("Unhandled output primitive type %#x.\n", primitive_type
);
849 ins
->declaration
.primitive_type
= WINED3D_PT_UNDEFINED
;
853 ins
->declaration
.primitive_type
= output_primitive_type_table
[primitive_type
];
856 else if (opcode
== WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE
)
858 enum wined3d_sm4_input_primitive_type primitive_type
;
860 primitive_type
= (opcode_token
& WINED3D_SM4_PRIMITIVE_TYPE_MASK
) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT
;
861 if (primitive_type
>= sizeof(input_primitive_type_table
) / sizeof(*input_primitive_type_table
))
863 FIXME("Unhandled input primitive type %#x.\n", primitive_type
);
864 ins
->declaration
.primitive_type
= WINED3D_PT_UNDEFINED
;
868 ins
->declaration
.primitive_type
= input_primitive_type_table
[primitive_type
];
871 else if (opcode
== WINED3D_SM4_OP_DCL_VERTICES_OUT
)
873 ins
->declaration
.count
= *p
++;
877 for (i
= 0; i
< ins
->dst_count
; ++i
)
879 if (!(shader_sm4_read_dst_param(priv
, &p
, map_data_type(opcode_info
->dst_info
[i
]), &priv
->dst_param
[i
])))
881 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
886 for (i
= 0; i
< ins
->src_count
; ++i
)
888 if (!(shader_sm4_read_src_param(priv
, &p
, map_data_type(opcode_info
->src_info
[i
]), &priv
->src_param
[i
])))
890 ins
->handler_idx
= WINED3DSIH_TABLE_SIZE
;
897 static BOOL
shader_sm4_is_end(void *data
, const DWORD
**ptr
)
899 struct wined3d_sm4_data
*priv
= data
;
900 return *ptr
== priv
->end
;
903 const struct wined3d_shader_frontend sm4_shader_frontend
=
907 shader_sm4_read_header
,
908 shader_sm4_read_instruction
,