wined3d: Recognize the SM4 lt opcode.
[wine/multimedia.git] / dlls / wined3d / shader_sm4.c
blobb935eefc1ef4e66d0b7af2983a4f737b7360bf5c
/*
 * Copyright 2009 Henri Verbeet for CodeWeavers
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
 */
19 #include "config.h"
20 #include "wine/port.h"
22 #include "wined3d_private.h"
24 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
/*
 * Bit layout of the SM4 tokens decoded in this file. Each field is described
 * by a shift and a mask that is already shifted into position.
 */

/* Opcode token: opcode number in the low byte, instruction length above it. */
#define WINED3D_SM4_OPCODE_MASK                     0xff
#define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT        24
#define WINED3D_SM4_INSTRUCTION_LENGTH_MASK         (0xf << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)

/* Parameter token: register type and "order" (number of index tokens that follow). */
#define WINED3D_SM4_REGISTER_TYPE_SHIFT             12
#define WINED3D_SM4_REGISTER_TYPE_MASK              (0xf << WINED3D_SM4_REGISTER_TYPE_SHIFT)
#define WINED3D_SM4_REGISTER_ORDER_SHIFT            20
#define WINED3D_SM4_REGISTER_ORDER_MASK             (0x3 << WINED3D_SM4_REGISTER_ORDER_SHIFT)

/* Parameter token: immediate constant type, read for immediate constant registers. */
#define WINED3D_SM4_IMMCONST_TYPE_SHIFT             0
#define WINED3D_SM4_IMMCONST_TYPE_MASK              (0x3 << WINED3D_SM4_IMMCONST_TYPE_SHIFT)

/* Parameter token: destination write mask and source swizzle start at the same bit. */
#define WINED3D_SM4_WRITEMASK_SHIFT                 4
#define WINED3D_SM4_WRITEMASK_MASK                  (0xf << WINED3D_SM4_WRITEMASK_SHIFT)
#define WINED3D_SM4_SWIZZLE_SHIFT                   4
#define WINED3D_SM4_SWIZZLE_MASK                    (0xff << WINED3D_SM4_SWIZZLE_SHIFT)

/* Version token: major version in bits 4-7, minor version in bits 0-3. */
#define WINED3D_SM4_VERSION_MAJOR(version)          (((version) >> 4) & 0xf)
#define WINED3D_SM4_VERSION_MINOR(version)          (((version) >> 0) & 0xf)
/* SM4 opcode numbers recognized by this parser, as found in the low byte of
 * an opcode token (see WINED3D_SM4_OPCODE_MASK). */
enum wined3d_sm4_opcode
{
    WINED3D_SM4_OP_ADD      = 0x00,
    WINED3D_SM4_OP_BREAKC   = 0x03,
    WINED3D_SM4_OP_DP3      = 0x10,
    WINED3D_SM4_OP_DP4      = 0x11,
    WINED3D_SM4_OP_EMIT     = 0x13,
    WINED3D_SM4_OP_EXP      = 0x19,
    WINED3D_SM4_OP_IADD     = 0x1e,
    WINED3D_SM4_OP_IGE      = 0x21,
    WINED3D_SM4_OP_LOG      = 0x2f,
    WINED3D_SM4_OP_LT       = 0x31,
    WINED3D_SM4_OP_MIN      = 0x33,
    WINED3D_SM4_OP_MAX      = 0x34,
    WINED3D_SM4_OP_MOV      = 0x36,
    WINED3D_SM4_OP_MUL      = 0x38,
    WINED3D_SM4_OP_RET      = 0x3e,
    WINED3D_SM4_OP_RSQ      = 0x44,
    WINED3D_SM4_OP_SINCOS   = 0x4d,
};
/* Register type values extracted from a parameter token with
 * WINED3D_SM4_REGISTER_TYPE_MASK. The values double as indices into
 * register_type_table. */
enum wined3d_sm4_register_type
{
    WINED3D_SM4_RT_TEMP         = 0x0,
    WINED3D_SM4_RT_INPUT        = 0x1,
    WINED3D_SM4_RT_OUTPUT       = 0x2,
    WINED3D_SM4_RT_IMMCONST     = 0x4,
    WINED3D_SM4_RT_CONSTBUFFER  = 0x8,
};
/* Immediate constant kinds, extracted from a parameter token with
 * WINED3D_SM4_IMMCONST_TYPE_MASK. */
enum wined3d_sm4_immconst_type
{
    WINED3D_SM4_IMMCONST_FLOAT  = 0x1,  /* followed by 1 data token */
    WINED3D_SM4_IMMCONST_FLOAT4 = 0x2,  /* followed by 4 data tokens */
};
85 struct wined3d_sm4_data
87 struct wined3d_shader_version shader_version;
88 const DWORD *end;
89 const struct wined3d_shader_signature *output_signature;
92 struct wined3d_sm4_opcode_info
94 enum wined3d_sm4_opcode opcode;
95 enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
96 UINT dst_count;
97 UINT src_count;
100 struct sysval_map
102 enum wined3d_sysval_semantic sysval;
103 WINED3DSHADER_PARAM_REGISTER_TYPE register_type;
104 UINT register_idx;
107 static const struct wined3d_sm4_opcode_info opcode_table[] =
109 {WINED3D_SM4_OP_ADD, WINED3DSIH_ADD, 1, 2},
110 {WINED3D_SM4_OP_BREAKC, WINED3DSIH_BREAKP, 0, 1},
111 {WINED3D_SM4_OP_DP3, WINED3DSIH_DP3, 1, 2},
112 {WINED3D_SM4_OP_DP4, WINED3DSIH_DP4, 1, 2},
113 {WINED3D_SM4_OP_EMIT, WINED3DSIH_EMIT, 0, 0},
114 {WINED3D_SM4_OP_EXP, WINED3DSIH_EXP, 1, 1},
115 {WINED3D_SM4_OP_IADD, WINED3DSIH_IADD, 1, 2},
116 {WINED3D_SM4_OP_IGE, WINED3DSIH_IGE, 1, 2},
117 {WINED3D_SM4_OP_LOG, WINED3DSIH_LOG, 1, 1},
118 {WINED3D_SM4_OP_LT, WINED3DSIH_LT, 1, 2},
119 {WINED3D_SM4_OP_MIN, WINED3DSIH_MIN, 1, 2},
120 {WINED3D_SM4_OP_MAX, WINED3DSIH_MAX, 1, 2},
121 {WINED3D_SM4_OP_MOV, WINED3DSIH_MOV, 1, 1},
122 {WINED3D_SM4_OP_MUL, WINED3DSIH_MUL, 1, 2},
123 {WINED3D_SM4_OP_RET, WINED3DSIH_RET, 0, 0},
124 {WINED3D_SM4_OP_RSQ, WINED3DSIH_RSQ, 1, 1},
125 {WINED3D_SM4_OP_SINCOS, WINED3DSIH_SINCOS, 1, 2},
128 static const WINED3DSHADER_PARAM_REGISTER_TYPE register_type_table[] =
130 /* WINED3D_SM4_RT_TEMP */ WINED3DSPR_TEMP,
131 /* WINED3D_SM4_RT_INPUT */ WINED3DSPR_INPUT,
132 /* WINED3D_SM4_RT_OUTPUT */ WINED3DSPR_OUTPUT,
133 /* UNKNOWN */ 0,
134 /* WINED3D_SM4_RT_IMMCONST */ WINED3DSPR_IMMCONST,
135 /* UNKNOWN */ 0,
136 /* UNKNOWN */ 0,
137 /* UNKNOWN */ 0,
138 /* WINED3D_SM4_RT_CONSTBUFFER */ WINED3DSPR_CONSTBUFFER,
141 static const struct sysval_map sysval_map[] =
143 {WINED3D_SV_DEPTH, WINED3DSPR_DEPTHOUT, 0},
144 {WINED3D_SV_TARGET0, WINED3DSPR_COLOROUT, 0},
145 {WINED3D_SV_TARGET1, WINED3DSPR_COLOROUT, 1},
146 {WINED3D_SV_TARGET2, WINED3DSPR_COLOROUT, 2},
147 {WINED3D_SV_TARGET3, WINED3DSPR_COLOROUT, 3},
148 {WINED3D_SV_TARGET4, WINED3DSPR_COLOROUT, 4},
149 {WINED3D_SV_TARGET5, WINED3DSPR_COLOROUT, 5},
150 {WINED3D_SV_TARGET6, WINED3DSPR_COLOROUT, 6},
151 {WINED3D_SV_TARGET7, WINED3DSPR_COLOROUT, 7},
154 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
156 unsigned int i;
158 for (i = 0; i < sizeof(opcode_table) / sizeof(*opcode_table); ++i)
160 if (opcode == opcode_table[i].opcode) return &opcode_table[i];
163 return NULL;
166 static void map_sysval(enum wined3d_sysval_semantic sysval, struct wined3d_shader_register *reg)
168 unsigned int i;
170 for (i = 0; i < sizeof(sysval_map) / sizeof(*sysval_map); ++i)
172 if (sysval == sysval_map[i].sysval)
174 reg->type = sysval_map[i].register_type;
175 reg->idx = sysval_map[i].register_idx;
180 static void map_register(struct wined3d_sm4_data *priv, struct wined3d_shader_register *reg)
182 switch (priv->shader_version.type)
184 case WINED3D_SHADER_TYPE_PIXEL:
185 if (reg->type == WINED3DSPR_OUTPUT)
187 unsigned int i;
188 const struct wined3d_shader_signature *s = priv->output_signature;
190 if (!s)
192 ERR("Shader has no output signature, unable to map register.\n");
193 break;
196 for (i = 0; i < s->element_count; ++i)
198 if (s->elements[i].register_idx == reg->idx)
200 map_sysval(s->elements[i].sysval_semantic, reg);
201 break;
205 break;
207 default:
208 break;
212 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
214 struct wined3d_sm4_data *priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv));
215 if (!priv)
217 ERR("Failed to allocate private data\n");
218 return NULL;
221 priv->output_signature = output_signature;
223 return priv;
226 static void shader_sm4_free(void *data)
228 HeapFree(GetProcessHeap(), 0, data);
231 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
233 struct wined3d_sm4_data *priv = data;
234 DWORD version_token;
236 priv->end = *ptr;
238 version_token = *(*ptr)++;
239 TRACE("version: 0x%08x\n", version_token);
241 TRACE("token count: %u\n", **ptr);
242 priv->end += *(*ptr)++;
244 switch (version_token >> 16)
246 case WINED3D_SM4_PS:
247 priv->shader_version.type = WINED3D_SHADER_TYPE_PIXEL;
248 break;
250 case WINED3D_SM4_VS:
251 priv->shader_version.type = WINED3D_SHADER_TYPE_VERTEX;
252 break;
254 case WINED3D_SM4_GS:
255 priv->shader_version.type = WINED3D_SHADER_TYPE_GEOMETRY;
256 break;
258 default:
259 FIXME("Unrecognized shader type %#x\n", version_token >> 16);
261 priv->shader_version.major = WINED3D_SM4_VERSION_MAJOR(version_token);
262 priv->shader_version.minor = WINED3D_SM4_VERSION_MINOR(version_token);
264 *shader_version = priv->shader_version;
267 static void shader_sm4_read_opcode(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins,
268 UINT *param_size)
270 const struct wined3d_sm4_opcode_info *opcode_info;
271 DWORD token = *(*ptr)++;
272 DWORD opcode = token & WINED3D_SM4_OPCODE_MASK;
274 *param_size = ((token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
276 opcode_info = get_opcode_info(opcode);
277 if (!opcode_info)
279 FIXME("Unrecognized opcode %#x, token 0x%08x\n", opcode, token);
280 ins->handler_idx = WINED3DSIH_TABLE_SIZE;
281 return;
284 ins->handler_idx = opcode_info->handler_idx;
285 ins->flags = 0;
286 ins->coissue = 0;
287 ins->predicate = 0;
288 ins->dst_count = opcode_info->dst_count;
289 ins->src_count = opcode_info->src_count;
292 static void shader_sm4_read_src_param(void *data, const DWORD **ptr, struct wined3d_shader_src_param *src_param,
293 struct wined3d_shader_src_param *src_rel_addr)
295 struct wined3d_sm4_data *priv = data;
296 DWORD token = *(*ptr)++;
297 enum wined3d_sm4_register_type register_type;
298 DWORD order;
300 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
301 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
303 FIXME("Unhandled register type %#x\n", register_type);
304 src_param->reg.type = WINED3DSPR_TEMP;
306 else
308 src_param->reg.type = register_type_table[register_type];
311 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
313 if (order < 1) src_param->reg.idx = ~0U;
314 else src_param->reg.idx = *(*ptr)++;
316 if (order < 2) src_param->reg.array_idx = ~0U;
317 else src_param->reg.array_idx = *(*ptr)++;
319 if (order > 2) FIXME("Unhandled order %u.\n", order);
321 if (register_type == WINED3D_SM4_RT_IMMCONST)
323 enum wined3d_sm4_immconst_type immconst_type =
324 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
325 src_param->swizzle = WINED3DSP_NOSWIZZLE;
327 switch(immconst_type)
329 case WINED3D_SM4_IMMCONST_FLOAT:
330 src_param->reg.immconst_type = WINED3D_IMMCONST_FLOAT;
331 memcpy(src_param->reg.immconst_data, *ptr, 1 * sizeof(DWORD));
332 *ptr += 1;
333 break;
335 case WINED3D_SM4_IMMCONST_FLOAT4:
336 src_param->reg.immconst_type = WINED3D_IMMCONST_FLOAT4;
337 memcpy(src_param->reg.immconst_data, *ptr, 4 * sizeof(DWORD));
338 *ptr += 4;
339 break;
341 default:
342 FIXME("Unhandled immediate constant type %#x\n", immconst_type);
343 break;
346 else
348 src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
351 src_param->modifiers = 0;
352 src_param->reg.rel_addr = NULL;
354 map_register(priv, &src_param->reg);
357 static void shader_sm4_read_dst_param(void *data, const DWORD **ptr, struct wined3d_shader_dst_param *dst_param,
358 struct wined3d_shader_src_param *dst_rel_addr)
360 struct wined3d_sm4_data *priv = data;
361 DWORD token = *(*ptr)++;
362 enum wined3d_sm4_register_type register_type;
363 DWORD order;
365 register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
366 if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
368 FIXME("Unhandled register type %#x\n", register_type);
369 dst_param->reg.type = WINED3DSPR_TEMP;
371 else
373 dst_param->reg.type = register_type_table[register_type];
376 order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
378 if (order < 1) dst_param->reg.idx = ~0U;
379 else dst_param->reg.idx = *(*ptr)++;
381 if (order < 2) dst_param->reg.array_idx = ~0U;
382 else dst_param->reg.array_idx = *(*ptr)++;
384 if (order > 2) FIXME("Unhandled order %u.\n", order);
386 dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
387 dst_param->modifiers = 0;
388 dst_param->shift = 0;
389 dst_param->reg.rel_addr = NULL;
391 map_register(priv, &dst_param->reg);
394 static void shader_sm4_read_semantic(const DWORD **ptr, struct wined3d_shader_semantic *semantic)
396 FIXME("ptr %p, semantic %p stub!\n", ptr, semantic);
399 static void shader_sm4_read_comment(const DWORD **ptr, const char **comment)
401 FIXME("ptr %p, comment %p stub!\n", ptr, comment);
402 *comment = NULL;
405 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
407 struct wined3d_sm4_data *priv = data;
408 return *ptr == priv->end;
411 const struct wined3d_shader_frontend sm4_shader_frontend =
413 shader_sm4_init,
414 shader_sm4_free,
415 shader_sm4_read_header,
416 shader_sm4_read_opcode,
417 shader_sm4_read_src_param,
418 shader_sm4_read_dst_param,
419 shader_sm4_read_semantic,
420 shader_sm4_read_comment,
421 shader_sm4_is_end,