Synchronize with trunk r58457.
[reactos.git] / dll / directx / wine / wined3d / shader_sm4.c
index 5285ae9..5f4d769 100644 (file)
 #include "wined3d_private.h"
 
 WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
+WINE_DECLARE_DEBUG_CHANNEL(d3d_bytecode);
 
 #define WINED3D_SM4_INSTRUCTION_MODIFIER        (1 << 31)
 
 #define WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT    24
 #define WINED3D_SM4_INSTRUCTION_LENGTH_MASK     (0xf << WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT)
 
+#define WINED3D_SM4_PRIMITIVE_TYPE_SHIFT        11
+#define WINED3D_SM4_PRIMITIVE_TYPE_MASK         (0x7 << WINED3D_SM4_PRIMITIVE_TYPE_SHIFT)
+
+#define WINED3D_SM4_INDEX_TYPE_SHIFT            11
+#define WINED3D_SM4_INDEX_TYPE_MASK             (0x1 << WINED3D_SM4_INDEX_TYPE_SHIFT)
+
 #define WINED3D_SM4_OPCODE_MASK                 0xff
 
 #define WINED3D_SM4_REGISTER_MODIFIER           (1 << 31)
 
+#define WINED3D_SM4_ADDRESSING_SHIFT1           25
+#define WINED3D_SM4_ADDRESSING_MASK1            (0x3 << WINED3D_SM4_ADDRESSING_SHIFT1)
+
+#define WINED3D_SM4_ADDRESSING_SHIFT0           22
+#define WINED3D_SM4_ADDRESSING_MASK0            (0x3 << WINED3D_SM4_ADDRESSING_SHIFT0)
+
 #define WINED3D_SM4_REGISTER_ORDER_SHIFT        20
 #define WINED3D_SM4_REGISTER_ORDER_MASK         (0x3 << WINED3D_SM4_REGISTER_ORDER_SHIFT)
 
 #define WINED3D_SM4_REGISTER_TYPE_SHIFT         12
 #define WINED3D_SM4_REGISTER_TYPE_MASK          (0xf << WINED3D_SM4_REGISTER_TYPE_SHIFT)
 
+#define WINED3D_SM4_SWIZZLE_TYPE_SHIFT          2
+#define WINED3D_SM4_SWIZZLE_TYPE_MASK           (0x3 << WINED3D_SM4_SWIZZLE_TYPE_SHIFT)
+
 #define WINED3D_SM4_IMMCONST_TYPE_SHIFT         0
 #define WINED3D_SM4_IMMCONST_TYPE_MASK          (0x3 << WINED3D_SM4_IMMCONST_TYPE_SHIFT)
 
@@ -50,54 +66,61 @@ WINE_DEFAULT_DEBUG_CHANNEL(d3d_shader);
 #define WINED3D_SM4_VERSION_MAJOR(version)      (((version) >> 4) & 0xf)
 #define WINED3D_SM4_VERSION_MINOR(version)      (((version) >> 0) & 0xf)
 
+#define WINED3D_SM4_ADDRESSING_RELATIVE         0x2
+#define WINED3D_SM4_ADDRESSING_OFFSET           0x1
+
 enum wined3d_sm4_opcode
 {
-    WINED3D_SM4_OP_ADD          = 0x00,
-    WINED3D_SM4_OP_AND          = 0x01,
-    WINED3D_SM4_OP_BREAK        = 0x02,
-    WINED3D_SM4_OP_BREAKC       = 0x03,
-    WINED3D_SM4_OP_CUT          = 0x09,
-    WINED3D_SM4_OP_DERIV_RTX    = 0x0b,
-    WINED3D_SM4_OP_DERIV_RTY    = 0x0c,
-    WINED3D_SM4_OP_DIV          = 0x0e,
-    WINED3D_SM4_OP_DP3          = 0x10,
-    WINED3D_SM4_OP_DP4          = 0x11,
-    WINED3D_SM4_OP_EMIT         = 0x13,
-    WINED3D_SM4_OP_ENDIF        = 0x15,
-    WINED3D_SM4_OP_ENDLOOP      = 0x16,
-    WINED3D_SM4_OP_EQ           = 0x18,
-    WINED3D_SM4_OP_EXP          = 0x19,
-    WINED3D_SM4_OP_FRC          = 0x1a,
-    WINED3D_SM4_OP_FTOI         = 0x1b,
-    WINED3D_SM4_OP_GE           = 0x1d,
-    WINED3D_SM4_OP_IADD         = 0x1e,
-    WINED3D_SM4_OP_IF           = 0x1f,
-    WINED3D_SM4_OP_IEQ          = 0x20,
-    WINED3D_SM4_OP_IGE          = 0x21,
-    WINED3D_SM4_OP_IMUL         = 0x26,
-    WINED3D_SM4_OP_ITOF         = 0x2b,
-    WINED3D_SM4_OP_LD           = 0x2d,
-    WINED3D_SM4_OP_LOG          = 0x2f,
-    WINED3D_SM4_OP_LOOP         = 0x30,
-    WINED3D_SM4_OP_LT           = 0x31,
-    WINED3D_SM4_OP_MAD          = 0x32,
-    WINED3D_SM4_OP_MIN          = 0x33,
-    WINED3D_SM4_OP_MAX          = 0x34,
-    WINED3D_SM4_OP_MOV          = 0x36,
-    WINED3D_SM4_OP_MOVC         = 0x37,
-    WINED3D_SM4_OP_MUL          = 0x38,
-    WINED3D_SM4_OP_RET          = 0x3e,
-    WINED3D_SM4_OP_ROUND_NI     = 0x41,
-    WINED3D_SM4_OP_RSQ          = 0x44,
-    WINED3D_SM4_OP_SAMPLE       = 0x45,
-    WINED3D_SM4_OP_SAMPLE_LOD   = 0x48,
-    WINED3D_SM4_OP_SAMPLE_GRAD  = 0x49,
-    WINED3D_SM4_OP_SQRT         = 0x4b,
-    WINED3D_SM4_OP_SINCOS       = 0x4d,
-    WINED3D_SM4_OP_UDIV         = 0x4e,
-    WINED3D_SM4_OP_USHR         = 0x55,
-    WINED3D_SM4_OP_UTOF         = 0x56,
-    WINED3D_SM4_OP_XOR          = 0x57,
+    WINED3D_SM4_OP_ADD                  = 0x00,
+    WINED3D_SM4_OP_AND                  = 0x01,
+    WINED3D_SM4_OP_BREAK                = 0x02,
+    WINED3D_SM4_OP_BREAKC               = 0x03,
+    WINED3D_SM4_OP_CUT                  = 0x09,
+    WINED3D_SM4_OP_DERIV_RTX            = 0x0b,
+    WINED3D_SM4_OP_DERIV_RTY            = 0x0c,
+    WINED3D_SM4_OP_DIV                  = 0x0e,
+    WINED3D_SM4_OP_DP3                  = 0x10,
+    WINED3D_SM4_OP_DP4                  = 0x11,
+    WINED3D_SM4_OP_EMIT                 = 0x13,
+    WINED3D_SM4_OP_ENDIF                = 0x15,
+    WINED3D_SM4_OP_ENDLOOP              = 0x16,
+    WINED3D_SM4_OP_EQ                   = 0x18,
+    WINED3D_SM4_OP_EXP                  = 0x19,
+    WINED3D_SM4_OP_FRC                  = 0x1a,
+    WINED3D_SM4_OP_FTOI                 = 0x1b,
+    WINED3D_SM4_OP_GE                   = 0x1d,
+    WINED3D_SM4_OP_IADD                 = 0x1e,
+    WINED3D_SM4_OP_IF                   = 0x1f,
+    WINED3D_SM4_OP_IEQ                  = 0x20,
+    WINED3D_SM4_OP_IGE                  = 0x21,
+    WINED3D_SM4_OP_IMUL                 = 0x26,
+    WINED3D_SM4_OP_ITOF                 = 0x2b,
+    WINED3D_SM4_OP_LD                   = 0x2d,
+    WINED3D_SM4_OP_LOG                  = 0x2f,
+    WINED3D_SM4_OP_LOOP                 = 0x30,
+    WINED3D_SM4_OP_LT                   = 0x31,
+    WINED3D_SM4_OP_MAD                  = 0x32,
+    WINED3D_SM4_OP_MIN                  = 0x33,
+    WINED3D_SM4_OP_MAX                  = 0x34,
+    WINED3D_SM4_OP_MOV                  = 0x36,
+    WINED3D_SM4_OP_MOVC                 = 0x37,
+    WINED3D_SM4_OP_MUL                  = 0x38,
+    WINED3D_SM4_OP_RET                  = 0x3e,
+    WINED3D_SM4_OP_ROUND_NI             = 0x41,
+    WINED3D_SM4_OP_RSQ                  = 0x44,
+    WINED3D_SM4_OP_SAMPLE               = 0x45,
+    WINED3D_SM4_OP_SAMPLE_LOD           = 0x48,
+    WINED3D_SM4_OP_SAMPLE_GRAD          = 0x49,
+    WINED3D_SM4_OP_SQRT                 = 0x4b,
+    WINED3D_SM4_OP_SINCOS               = 0x4d,
+    WINED3D_SM4_OP_UDIV                 = 0x4e,
+    WINED3D_SM4_OP_USHR                 = 0x55,
+    WINED3D_SM4_OP_UTOF                 = 0x56,
+    WINED3D_SM4_OP_XOR                  = 0x57,
+    WINED3D_SM4_OP_DCL_CONSTANT_BUFFER  = 0x59,
+    WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY  = 0x5c,
+    WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE  = 0x5d,
+    WINED3D_SM4_OP_DCL_VERTICES_OUT     = 0x5e,
 };
 
 enum wined3d_sm4_register_type
@@ -108,28 +131,62 @@ enum wined3d_sm4_register_type
     WINED3D_SM4_RT_IMMCONST     = 0x4,
     WINED3D_SM4_RT_SAMPLER      = 0x6,
     WINED3D_SM4_RT_CONSTBUFFER  = 0x8,
+    WINED3D_SM4_RT_PRIMID       = 0xb,
     WINED3D_SM4_RT_NULL         = 0xd,
 };
 
+enum wined3d_sm4_output_primitive_type
+{
+    WINED3D_SM4_OUTPUT_PT_POINTLIST     = 0x1,
+    WINED3D_SM4_OUTPUT_PT_LINELIST      = 0x3,
+    WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP = 0x5,
+};
+
+enum wined3d_sm4_input_primitive_type
+{
+    WINED3D_SM4_INPUT_PT_POINT          = 0x1,
+    WINED3D_SM4_INPUT_PT_LINE           = 0x2,
+    WINED3D_SM4_INPUT_PT_TRIANGLE       = 0x3,
+    WINED3D_SM4_INPUT_PT_LINEADJ        = 0x6,
+    WINED3D_SM4_INPUT_PT_TRIANGLEADJ    = 0x7,
+};
+
+enum wined3d_sm4_swizzle_type
+{
+    WINED3D_SM4_SWIZZLE_VEC4            = 0x1,
+    WINED3D_SM4_SWIZZLE_SCALAR          = 0x2,
+};
+
 enum wined3d_sm4_immconst_type
 {
     WINED3D_SM4_IMMCONST_SCALAR = 0x1,
     WINED3D_SM4_IMMCONST_VEC4   = 0x2,
 };
 
+struct wined3d_shader_src_param_entry
+{
+    struct list entry;
+    struct wined3d_shader_src_param param;
+};
+
 struct wined3d_sm4_data
 {
     struct wined3d_shader_version shader_version;
     const DWORD *end;
     const struct wined3d_shader_signature *output_signature;
+
+    struct wined3d_shader_src_param src_param[5];
+    struct wined3d_shader_dst_param dst_param[2];
+    struct list src_free;
+    struct list src;
 };
 
 struct wined3d_sm4_opcode_info
 {
     enum wined3d_sm4_opcode opcode;
     enum WINED3D_SHADER_INSTRUCTION_HANDLER handler_idx;
-    UINT dst_count;
-    UINT src_count;
+    const char *dst_info;
+    const char *src_info;
 };
 
 struct sysval_map
@@ -139,54 +196,65 @@ struct sysval_map
     UINT register_idx;
 };
 
+/*
+ * F -> WINED3D_DATA_FLOAT
+ * I -> WINED3D_DATA_INT
+ * R -> WINED3D_DATA_RESOURCE
+ * S -> WINED3D_DATA_SAMPLER
+ * U -> WINED3D_DATA_UINT
+ */
 static const struct wined3d_sm4_opcode_info opcode_table[] =
 {
-    {WINED3D_SM4_OP_ADD,        WINED3DSIH_ADD,         1,  2},
-    {WINED3D_SM4_OP_AND,        WINED3DSIH_AND,         1,  2},
-    {WINED3D_SM4_OP_BREAK,      WINED3DSIH_BREAK,       0,  0},
-    {WINED3D_SM4_OP_BREAKC,     WINED3DSIH_BREAKP,      0,  1},
-    {WINED3D_SM4_OP_CUT,        WINED3DSIH_CUT,         0,  0},
-    {WINED3D_SM4_OP_DERIV_RTX,  WINED3DSIH_DSX,         1,  1},
-    {WINED3D_SM4_OP_DERIV_RTY,  WINED3DSIH_DSY,         1,  1},
-    {WINED3D_SM4_OP_DIV,        WINED3DSIH_DIV,         1,  2},
-    {WINED3D_SM4_OP_DP3,        WINED3DSIH_DP3,         1,  2},
-    {WINED3D_SM4_OP_DP4,        WINED3DSIH_DP4,         1,  2},
-    {WINED3D_SM4_OP_EMIT,       WINED3DSIH_EMIT,        0,  0},
-    {WINED3D_SM4_OP_ENDIF,      WINED3DSIH_ENDIF,       0,  0},
-    {WINED3D_SM4_OP_ENDLOOP,    WINED3DSIH_ENDLOOP,     0,  0},
-    {WINED3D_SM4_OP_EQ,         WINED3DSIH_EQ,          1,  2},
-    {WINED3D_SM4_OP_EXP,        WINED3DSIH_EXP,         1,  1},
-    {WINED3D_SM4_OP_FRC,        WINED3DSIH_FRC,         1,  1},
-    {WINED3D_SM4_OP_FTOI,       WINED3DSIH_FTOI,        1,  1},
-    {WINED3D_SM4_OP_GE,         WINED3DSIH_GE,          1,  2},
-    {WINED3D_SM4_OP_IADD,       WINED3DSIH_IADD,        1,  2},
-    {WINED3D_SM4_OP_IF,         WINED3DSIH_IF,          0,  1},
-    {WINED3D_SM4_OP_IEQ,        WINED3DSIH_IEQ,         1,  2},
-    {WINED3D_SM4_OP_IGE,        WINED3DSIH_IGE,         1,  2},
-    {WINED3D_SM4_OP_IMUL,       WINED3DSIH_IMUL,        2,  2},
-    {WINED3D_SM4_OP_ITOF,       WINED3DSIH_ITOF,        1,  1},
-    {WINED3D_SM4_OP_LD,         WINED3DSIH_LD,          1,  2},
-    {WINED3D_SM4_OP_LOG,        WINED3DSIH_LOG,         1,  1},
-    {WINED3D_SM4_OP_LOOP,       WINED3DSIH_LOOP,        0,  0},
-    {WINED3D_SM4_OP_LT,         WINED3DSIH_LT,          1,  2},
-    {WINED3D_SM4_OP_MAD,        WINED3DSIH_MAD,         1,  3},
-    {WINED3D_SM4_OP_MIN,        WINED3DSIH_MIN,         1,  2},
-    {WINED3D_SM4_OP_MAX,        WINED3DSIH_MAX,         1,  2},
-    {WINED3D_SM4_OP_MOV,        WINED3DSIH_MOV,         1,  1},
-    {WINED3D_SM4_OP_MOVC,       WINED3DSIH_MOVC,        1,  3},
-    {WINED3D_SM4_OP_MUL,        WINED3DSIH_MUL,         1,  2},
-    {WINED3D_SM4_OP_RET,        WINED3DSIH_RET,         0,  0},
-    {WINED3D_SM4_OP_ROUND_NI,   WINED3DSIH_ROUND_NI,    1,  1},
-    {WINED3D_SM4_OP_RSQ,        WINED3DSIH_RSQ,         1,  1},
-    {WINED3D_SM4_OP_SAMPLE,     WINED3DSIH_SAMPLE,      1,  3},
-    {WINED3D_SM4_OP_SAMPLE_LOD, WINED3DSIH_SAMPLE_LOD,  1,  4},
-    {WINED3D_SM4_OP_SAMPLE_GRAD,WINED3DSIH_SAMPLE_GRAD, 1,  5},
-    {WINED3D_SM4_OP_SQRT,       WINED3DSIH_SQRT,        1,  1},
-    {WINED3D_SM4_OP_SINCOS,     WINED3DSIH_SINCOS,      2,  1},
-    {WINED3D_SM4_OP_UDIV,       WINED3DSIH_UDIV,        2,  2},
-    {WINED3D_SM4_OP_USHR,       WINED3DSIH_USHR,        1,  2},
-    {WINED3D_SM4_OP_UTOF,       WINED3DSIH_UTOF,        1,  1},
-    {WINED3D_SM4_OP_XOR,        WINED3DSIH_XOR,         1,  2},
+    {WINED3D_SM4_OP_ADD,                    WINED3DSIH_ADD,                 "F",    "FF"},
+    {WINED3D_SM4_OP_AND,                    WINED3DSIH_AND,                 "U",    "UU"},
+    {WINED3D_SM4_OP_BREAK,                  WINED3DSIH_BREAK,               "",     ""},
+    {WINED3D_SM4_OP_BREAKC,                 WINED3DSIH_BREAKP,              "",     "U"},
+    {WINED3D_SM4_OP_CUT,                    WINED3DSIH_CUT,                 "",     ""},
+    {WINED3D_SM4_OP_DERIV_RTX,              WINED3DSIH_DSX,                 "F",    "F"},
+    {WINED3D_SM4_OP_DERIV_RTY,              WINED3DSIH_DSY,                 "F",    "F"},
+    {WINED3D_SM4_OP_DIV,                    WINED3DSIH_DIV,                 "F",    "FF"},
+    {WINED3D_SM4_OP_DP3,                    WINED3DSIH_DP3,                 "F",    "FF"},
+    {WINED3D_SM4_OP_DP4,                    WINED3DSIH_DP4,                 "F",    "FF"},
+    {WINED3D_SM4_OP_EMIT,                   WINED3DSIH_EMIT,                "",     ""},
+    {WINED3D_SM4_OP_ENDIF,                  WINED3DSIH_ENDIF,               "",     ""},
+    {WINED3D_SM4_OP_ENDLOOP,                WINED3DSIH_ENDLOOP,             "",     ""},
+    {WINED3D_SM4_OP_EQ,                     WINED3DSIH_EQ,                  "U",    "FF"},
+    {WINED3D_SM4_OP_EXP,                    WINED3DSIH_EXP,                 "F",    "F"},
+    {WINED3D_SM4_OP_FRC,                    WINED3DSIH_FRC,                 "F",    "F"},
+    {WINED3D_SM4_OP_FTOI,                   WINED3DSIH_FTOI,                "I",    "F"},
+    {WINED3D_SM4_OP_GE,                     WINED3DSIH_GE,                  "U",    "FF"},
+    {WINED3D_SM4_OP_IADD,                   WINED3DSIH_IADD,                "I",    "II"},
+    {WINED3D_SM4_OP_IF,                     WINED3DSIH_IF,                  "",     "U"},
+    {WINED3D_SM4_OP_IEQ,                    WINED3DSIH_IEQ,                 "U",    "II"},
+    {WINED3D_SM4_OP_IGE,                    WINED3DSIH_IGE,                 "U",    "II"},
+    {WINED3D_SM4_OP_IMUL,                   WINED3DSIH_IMUL,                "II",   "II"},
+    {WINED3D_SM4_OP_ITOF,                   WINED3DSIH_ITOF,                "F",    "I"},
+    {WINED3D_SM4_OP_LD,                     WINED3DSIH_LD,                  "U",    "FR"},
+    {WINED3D_SM4_OP_LOG,                    WINED3DSIH_LOG,                 "F",    "F"},
+    {WINED3D_SM4_OP_LOOP,                   WINED3DSIH_LOOP,                "",     ""},
+    {WINED3D_SM4_OP_LT,                     WINED3DSIH_LT,                  "U",    "FF"},
+    {WINED3D_SM4_OP_MAD,                    WINED3DSIH_MAD,                 "F",    "FFF"},
+    {WINED3D_SM4_OP_MIN,                    WINED3DSIH_MIN,                 "F",    "FF"},
+    {WINED3D_SM4_OP_MAX,                    WINED3DSIH_MAX,                 "F",    "FF"},
+    {WINED3D_SM4_OP_MOV,                    WINED3DSIH_MOV,                 "F",    "F"},
+    {WINED3D_SM4_OP_MOVC,                   WINED3DSIH_MOVC,                "F",    "UFF"},
+    {WINED3D_SM4_OP_MUL,                    WINED3DSIH_MUL,                 "F",    "FF"},
+    {WINED3D_SM4_OP_RET,                    WINED3DSIH_RET,                 "",     ""},
+    {WINED3D_SM4_OP_ROUND_NI,               WINED3DSIH_ROUND_NI,            "F",    "F"},
+    {WINED3D_SM4_OP_RSQ,                    WINED3DSIH_RSQ,                 "F",    "F"},
+    {WINED3D_SM4_OP_SAMPLE,                 WINED3DSIH_SAMPLE,              "U",    "FRS"},
+    {WINED3D_SM4_OP_SAMPLE_LOD,             WINED3DSIH_SAMPLE_LOD,          "U",    "FRSF"},
+    {WINED3D_SM4_OP_SAMPLE_GRAD,            WINED3DSIH_SAMPLE_GRAD,         "U",    "FRSFF"},
+    {WINED3D_SM4_OP_SQRT,                   WINED3DSIH_SQRT,                "F",    "F"},
+    {WINED3D_SM4_OP_SINCOS,                 WINED3DSIH_SINCOS,              "FF",   "F"},
+    {WINED3D_SM4_OP_UDIV,                   WINED3DSIH_UDIV,                "UU",   "UU"},
+    {WINED3D_SM4_OP_USHR,                   WINED3DSIH_USHR,                "U",    "UU"},
+    {WINED3D_SM4_OP_UTOF,                   WINED3DSIH_UTOF,                "F",    "U"},
+    {WINED3D_SM4_OP_XOR,                    WINED3DSIH_XOR,                 "U",    "UU"},
+    {WINED3D_SM4_OP_DCL_CONSTANT_BUFFER,    WINED3DSIH_DCL_CONSTANT_BUFFER, "",     ""},
+    {WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY,    WINED3DSIH_DCL_OUTPUT_TOPOLOGY, "",     ""},
+    {WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE,    WINED3DSIH_DCL_INPUT_PRIMITIVE, "",     ""},
+    {WINED3D_SM4_OP_DCL_VERTICES_OUT,       WINED3DSIH_DCL_VERTICES_OUT,    "",     ""},
 };
 
 static const enum wined3d_shader_register_type register_type_table[] =
@@ -202,11 +270,33 @@ static const enum wined3d_shader_register_type register_type_table[] =
     /* WINED3D_SM4_RT_CONSTBUFFER */    WINED3DSPR_CONSTBUFFER,
     /* UNKNOWN */                       0,
     /* UNKNOWN */                       0,
-    /* UNKNOWN */                       0,
+    /* WINED3D_SM4_RT_PRIMID */         WINED3DSPR_PRIMID,
     /* UNKNOWN */                       0,
     /* WINED3D_SM4_RT_NULL */           WINED3DSPR_NULL,
 };
 
+static const enum wined3d_primitive_type output_primitive_type_table[] =
+{
+    /* UNKNOWN */                               WINED3D_PT_UNDEFINED,
+    /* WINED3D_SM4_OUTPUT_PT_POINTLIST */       WINED3D_PT_POINTLIST,
+    /* UNKNOWN */                               WINED3D_PT_UNDEFINED,
+    /* WINED3D_SM4_OUTPUT_PT_LINELIST */        WINED3D_PT_LINELIST,
+    /* UNKNOWN */                               WINED3D_PT_UNDEFINED,
+    /* WINED3D_SM4_OUTPUT_PT_TRIANGLESTRIP */   WINED3D_PT_TRIANGLESTRIP,
+};
+
+static const enum wined3d_primitive_type input_primitive_type_table[] =
+{
+    /* UNKNOWN */                               WINED3D_PT_UNDEFINED,
+    /* WINED3D_SM4_INPUT_PT_POINT */            WINED3D_PT_POINTLIST,
+    /* WINED3D_SM4_INPUT_PT_LINE */             WINED3D_PT_LINELIST,
+    /* WINED3D_SM4_INPUT_PT_TRIANGLE */         WINED3D_PT_TRIANGLELIST,
+    /* UNKNOWN */                               WINED3D_PT_UNDEFINED,
+    /* UNKNOWN */                               WINED3D_PT_UNDEFINED,
+    /* WINED3D_SM4_INPUT_PT_LINEADJ */          WINED3D_PT_LINELIST_ADJ,
+    /* WINED3D_SM4_INPUT_PT_TRIANGLEADJ */      WINED3D_PT_TRIANGLELIST_ADJ,
+};
+
 static const struct sysval_map sysval_map[] =
 {
     {WINED3D_SV_DEPTH,      WINED3DSPR_DEPTHOUT,    0},
@@ -220,6 +310,9 @@ static const struct sysval_map sysval_map[] =
     {WINED3D_SV_TARGET7,    WINED3DSPR_COLOROUT,    7},
 };
 
+static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
+        enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param);
+
 static const struct wined3d_sm4_opcode_info *get_opcode_info(enum wined3d_sm4_opcode opcode)
 {
     unsigned int i;
@@ -241,7 +334,7 @@ static void map_sysval(enum wined3d_sysval_semantic sysval, struct wined3d_shade
         if (sysval == sysval_map[i].sysval)
         {
             reg->type = sysval_map[i].register_type;
-            reg->idx = sysval_map[i].register_idx;
+            reg->idx[0].offset = sysval_map[i].register_idx;
         }
     }
 }
@@ -264,7 +357,7 @@ static void map_register(const struct wined3d_sm4_data *priv, struct wined3d_sha
 
                 for (i = 0; i < s->element_count; ++i)
                 {
-                    if (s->elements[i].register_idx == reg->idx)
+                    if (s->elements[i].register_idx == reg->idx[0].offset)
                     {
                         map_sysval(s->elements[i].sysval_semantic, reg);
                         break;
@@ -278,6 +371,26 @@ static void map_register(const struct wined3d_sm4_data *priv, struct wined3d_sha
     }
 }
 
+static enum wined3d_data_type map_data_type(char t)
+{
+    switch (t)
+    {
+        case 'F':
+            return WINED3D_DATA_FLOAT;
+        case 'I':
+            return WINED3D_DATA_INT;
+        case 'R':
+            return WINED3D_DATA_RESOURCE;
+        case 'S':
+            return WINED3D_DATA_SAMPLER;
+        case 'U':
+            return WINED3D_DATA_UINT;
+        default:
+            ERR("Invalid data type '%c'.\n", t);
+            return WINED3D_DATA_FLOAT;
+    }
+}
+
 static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader_signature *output_signature)
 {
     struct wined3d_sm4_data *priv = HeapAlloc(GetProcessHeap(), 0, sizeof(*priv));
@@ -288,13 +401,45 @@ static void *shader_sm4_init(const DWORD *byte_code, const struct wined3d_shader
     }
 
     priv->output_signature = output_signature;
+    list_init(&priv->src_free);
+    list_init(&priv->src);
 
     return priv;
 }
 
 static void shader_sm4_free(void *data)
 {
-    HeapFree(GetProcessHeap(), 0, data);
+    struct wined3d_shader_src_param_entry *e1, *e2;
+    struct wined3d_sm4_data *priv = data;
+
+    list_move_head(&priv->src_free, &priv->src);
+    LIST_FOR_EACH_ENTRY_SAFE(e1, e2, &priv->src_free, struct wined3d_shader_src_param_entry, entry)
+    {
+        HeapFree(GetProcessHeap(), 0, e1);
+    }
+    HeapFree(GetProcessHeap(), 0, priv);
+}
+
+static struct wined3d_shader_src_param *get_src_param(struct wined3d_sm4_data *priv)
+{
+    struct wined3d_shader_src_param_entry *e;
+    struct list *elem;
+
+    if (!list_empty(&priv->src_free))
+    {
+        elem = list_head(&priv->src_free);
+        list_remove(elem);
+    }
+    else
+    {
+        if (!(e = HeapAlloc(GetProcessHeap(), 0, sizeof(*e))))
+            return NULL;
+        elem = &e->entry;
+    }
+
+    list_add_tail(&priv->src, elem);
+    e = LIST_ENTRY(elem, struct wined3d_shader_src_param_entry, entry);
+    return &e->param;
 }
 
 static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d_shader_version *shader_version)
@@ -333,175 +478,316 @@ static void shader_sm4_read_header(void *data, const DWORD **ptr, struct wined3d
     *shader_version = priv->shader_version;
 }
 
-static void shader_sm4_read_opcode(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins,
-        UINT *param_size)
+static BOOL shader_sm4_read_reg_idx(struct wined3d_sm4_data *priv, const DWORD **ptr,
+        DWORD addressing, struct wined3d_shader_register_index *reg_idx)
 {
-    const struct wined3d_sm4_opcode_info *opcode_info;
-    DWORD token = *(*ptr)++;
-    DWORD opcode = token & WINED3D_SM4_OPCODE_MASK;
-
-    *param_size = ((token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
-
-    opcode_info = get_opcode_info(opcode);
-    if (!opcode_info)
+    if (addressing & WINED3D_SM4_ADDRESSING_RELATIVE)
     {
-        FIXME("Unrecognized opcode %#x, token 0x%08x\n", opcode, token);
-        ins->handler_idx = WINED3DSIH_TABLE_SIZE;
-        return;
-    }
+        struct wined3d_shader_src_param *rel_addr = get_src_param(priv);
 
-    ins->handler_idx = opcode_info->handler_idx;
-    ins->flags = 0;
-    ins->coissue = 0;
-    ins->predicate = 0;
-    ins->dst_count = opcode_info->dst_count;
-    ins->src_count = opcode_info->src_count;
+        if (!(reg_idx->rel_addr = rel_addr))
+        {
+            ERR("Failed to get src param for relative addressing.\n");
+            return FALSE;
+        }
 
-    if (token & WINED3D_SM4_INSTRUCTION_MODIFIER)
+        if (addressing & WINED3D_SM4_ADDRESSING_OFFSET)
+            reg_idx->offset = *(*ptr)++;
+        else
+            reg_idx->offset = 0;
+        shader_sm4_read_src_param(priv, ptr, WINED3D_DATA_INT, rel_addr);
+    }
+    else
     {
-        DWORD modifier = *(*ptr)++;
-        FIXME("Skipping modifier 0x%08x.\n", modifier);
+        reg_idx->rel_addr = NULL;
+        reg_idx->offset = *(*ptr)++;
     }
+
+    return TRUE;
 }
 
-static void shader_sm4_read_src_param(void *data, const DWORD **ptr, struct wined3d_shader_src_param *src_param,
-        struct wined3d_shader_src_param *src_rel_addr)
+static BOOL shader_sm4_read_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
+        enum wined3d_data_type data_type, struct wined3d_shader_register *param,
+        enum wined3d_shader_src_modifier *modifier)
 {
-    struct wined3d_sm4_data *priv = data;
-    DWORD token = *(*ptr)++;
     enum wined3d_sm4_register_type register_type;
+    DWORD token = *(*ptr)++;
     DWORD order;
 
     register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
     if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
     {
-        FIXME("Unhandled register type %#x\n", register_type);
-        src_param->reg.type = WINED3DSPR_TEMP;
+        FIXME("Unhandled register type %#x.\n", register_type);
+        param->type = WINED3DSPR_TEMP;
     }
     else
     {
-        src_param->reg.type = register_type_table[register_type];
+        param->type = register_type_table[register_type];
     }
+    param->data_type = data_type;
 
     if (token & WINED3D_SM4_REGISTER_MODIFIER)
     {
-        DWORD modifier = *(*ptr)++;
+        DWORD m = *(*ptr)++;
 
         /* FIXME: This will probably break down at some point. The SM4
          * modifiers look like flags, while wined3d currently has an enum
          * with possible combinations, e.g. WINED3DSPSM_ABSNEG. */
-        switch (modifier)
+        switch (m)
         {
             case 0x41:
-                src_param->modifiers = WINED3DSPSM_NEG;
+                *modifier = WINED3DSPSM_NEG;
                 break;
 
             case 0x81:
-                src_param->modifiers = WINED3DSPSM_ABS;
+                *modifier = WINED3DSPSM_ABS;
                 break;
 
             default:
-                FIXME("Skipping modifier 0x%08x.\n", modifier);
-                src_param->modifiers = WINED3DSPSM_NONE;
+                FIXME("Skipping modifier 0x%08x.\n", m);
+                *modifier = WINED3DSPSM_NONE;
                 break;
         }
     }
     else
     {
-        src_param->modifiers = WINED3DSPSM_NONE;
+        *modifier = WINED3DSPSM_NONE;
     }
 
     order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
 
-    if (order < 1) src_param->reg.idx = ~0U;
-    else src_param->reg.idx = *(*ptr)++;
+    if (order < 1)
+        param->idx[0].offset = ~0U;
+    else
+    {
+        DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK0) >> WINED3D_SM4_ADDRESSING_SHIFT0;
+        if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[0])))
+        {
+            ERR("Failed to read register index.\n");
+            return FALSE;
+        }
+    }
 
-    if (order < 2) src_param->reg.array_idx = ~0U;
-    else src_param->reg.array_idx = *(*ptr)++;
+    if (order < 2)
+        param->idx[1].offset = ~0U;
+    else
+    {
+        DWORD addressing = (token & WINED3D_SM4_ADDRESSING_MASK1) >> WINED3D_SM4_ADDRESSING_SHIFT1;
+        if (!(shader_sm4_read_reg_idx(priv, ptr, addressing, &param->idx[1])))
+        {
+            ERR("Failed to read register index.\n");
+            return FALSE;
+        }
+    }
 
-    if (order > 2) FIXME("Unhandled order %u.\n", order);
+    if (order > 2)
+        FIXME("Unhandled order %u.\n", order);
 
     if (register_type == WINED3D_SM4_RT_IMMCONST)
     {
         enum wined3d_sm4_immconst_type immconst_type =
                 (token & WINED3D_SM4_IMMCONST_TYPE_MASK) >> WINED3D_SM4_IMMCONST_TYPE_SHIFT;
-        src_param->swizzle = WINED3DSP_NOSWIZZLE;
 
-        switch(immconst_type)
+        switch (immconst_type)
         {
             case WINED3D_SM4_IMMCONST_SCALAR:
-                src_param->reg.immconst_type = WINED3D_IMMCONST_SCALAR;
-                memcpy(src_param->reg.immconst_data, *ptr, 1 * sizeof(DWORD));
+                param->immconst_type = WINED3D_IMMCONST_SCALAR;
+                memcpy(param->immconst_data, *ptr, 1 * sizeof(DWORD));
                 *ptr += 1;
                 break;
 
             case WINED3D_SM4_IMMCONST_VEC4:
-                src_param->reg.immconst_type = WINED3D_IMMCONST_VEC4;
-                memcpy(src_param->reg.immconst_data, *ptr, 4 * sizeof(DWORD));
+                param->immconst_type = WINED3D_IMMCONST_VEC4;
+                memcpy(param->immconst_data, *ptr, 4 * sizeof(DWORD));
                 *ptr += 4;
                 break;
 
             default:
-                FIXME("Unhandled immediate constant type %#x\n", immconst_type);
+                FIXME("Unhandled immediate constant type %#x.\n", immconst_type);
                 break;
         }
     }
-    else
-    {
-        src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
-    }
 
-    src_param->reg.rel_addr = NULL;
+    map_register(priv, param);
 
-    map_register(priv, &src_param->reg);
+    return TRUE;
 }
 
-static void shader_sm4_read_dst_param(void *data, const DWORD **ptr, struct wined3d_shader_dst_param *dst_param,
-        struct wined3d_shader_src_param *dst_rel_addr)
+static BOOL shader_sm4_read_src_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
+        enum wined3d_data_type data_type, struct wined3d_shader_src_param *src_param)
 {
-    struct wined3d_sm4_data *priv = data;
-    DWORD token = *(*ptr)++;
-    enum wined3d_sm4_register_type register_type;
-    DWORD order;
+    DWORD token = **ptr;
 
-    register_type = (token & WINED3D_SM4_REGISTER_TYPE_MASK) >> WINED3D_SM4_REGISTER_TYPE_SHIFT;
-    if (register_type >= sizeof(register_type_table) / sizeof(*register_type_table))
+    if (!shader_sm4_read_param(priv, ptr, data_type, &src_param->reg, &src_param->modifiers))
     {
-        FIXME("Unhandled register type %#x\n", register_type);
-        dst_param->reg.type = WINED3DSPR_TEMP;
+        ERR("Failed to read parameter.\n");
+        return FALSE;
+    }
+
+    if (src_param->reg.type == WINED3DSPR_IMMCONST)
+    {
+        src_param->swizzle = WINED3DSP_NOSWIZZLE;
     }
     else
     {
-        dst_param->reg.type = register_type_table[register_type];
+        enum wined3d_sm4_swizzle_type swizzle_type =
+                (token & WINED3D_SM4_SWIZZLE_TYPE_MASK) >> WINED3D_SM4_SWIZZLE_TYPE_SHIFT;
+
+        switch (swizzle_type)
+        {
+            case WINED3D_SM4_SWIZZLE_SCALAR:
+                src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
+                src_param->swizzle = (src_param->swizzle & 0x3) * 0x55;
+                break;
+
+            case WINED3D_SM4_SWIZZLE_VEC4:
+                src_param->swizzle = (token & WINED3D_SM4_SWIZZLE_MASK) >> WINED3D_SM4_SWIZZLE_SHIFT;
+                break;
+
+            default:
+                FIXME("Unhandled swizzle type %#x.\n", swizzle_type);
+                break;
+        }
     }
 
-    order = (token & WINED3D_SM4_REGISTER_ORDER_MASK) >> WINED3D_SM4_REGISTER_ORDER_SHIFT;
+    return TRUE;
+}
 
-    if (order < 1) dst_param->reg.idx = ~0U;
-    else dst_param->reg.idx = *(*ptr)++;
+static BOOL shader_sm4_read_dst_param(struct wined3d_sm4_data *priv, const DWORD **ptr,
+        enum wined3d_data_type data_type, struct wined3d_shader_dst_param *dst_param)
+{
+    enum wined3d_shader_src_modifier modifier;
+    DWORD token = **ptr;
 
-    if (order < 2) dst_param->reg.array_idx = ~0U;
-    else dst_param->reg.array_idx = *(*ptr)++;
+    if (!shader_sm4_read_param(priv, ptr, data_type, &dst_param->reg, &modifier))
+    {
+        ERR("Failed to read parameter.\n");
+        return FALSE;
+    }
 
-    if (order > 2) FIXME("Unhandled order %u.\n", order);
+    if (modifier != WINED3DSPSM_NONE)
+    {
+        ERR("Invalid source modifier %#x on destination register.\n", modifier);
+        return FALSE;
+    }
 
     dst_param->write_mask = (token & WINED3D_SM4_WRITEMASK_MASK) >> WINED3D_SM4_WRITEMASK_SHIFT;
     dst_param->modifiers = 0;
     dst_param->shift = 0;
-    dst_param->reg.rel_addr = NULL;
 
-    map_register(priv, &dst_param->reg);
+    return TRUE;
 }
 
-static void shader_sm4_read_semantic(const DWORD **ptr, struct wined3d_shader_semantic *semantic)
+static void shader_sm4_read_instruction(void *data, const DWORD **ptr, struct wined3d_shader_instruction *ins)
 {
-    FIXME("ptr %p, semantic %p stub!\n", ptr, semantic);
-}
+    const struct wined3d_sm4_opcode_info *opcode_info;
+    struct wined3d_sm4_data *priv = data;
+    DWORD opcode_token, opcode;
+    const DWORD *p;
+    UINT i, len;
 
-static void shader_sm4_read_comment(const DWORD **ptr, const char **comment, UINT *comment_size)
-{
-    FIXME("ptr %p, comment %p, comment_size %p stub!\n", ptr, comment, comment_size);
-    *comment = NULL;
+    list_move_head(&priv->src_free, &priv->src);
+
+    opcode_token = *(*ptr)++;
+    opcode = opcode_token & WINED3D_SM4_OPCODE_MASK;
+    len = ((opcode_token & WINED3D_SM4_INSTRUCTION_LENGTH_MASK) >> WINED3D_SM4_INSTRUCTION_LENGTH_SHIFT) - 1;
+
+    if (TRACE_ON(d3d_bytecode))
+    {
+        TRACE_(d3d_bytecode)("[ %08x ", opcode_token);
+        for (i = 0; i < len; ++i)
+        {
+            TRACE_(d3d_bytecode)("%08x ", (*ptr)[i]);
+        }
+        TRACE_(d3d_bytecode)("]\n");
+    }
+
+    if (!(opcode_info = get_opcode_info(opcode)))
+    {
+        FIXME("Unrecognized opcode %#x, opcode_token 0x%08x.\n", opcode, opcode_token);
+        ins->handler_idx = WINED3DSIH_TABLE_SIZE;
+        *ptr += len;
+        return;
+    }
+
+    ins->handler_idx = opcode_info->handler_idx;
+    ins->flags = 0;
+    ins->coissue = 0;
+    ins->predicate = NULL;
+    ins->dst_count = strlen(opcode_info->dst_info);
+    ins->dst = priv->dst_param;
+    ins->src_count = strlen(opcode_info->src_info);
+    ins->src = priv->src_param;
+
+    p = *ptr;
+    *ptr += len;
+
+    if (opcode_token & WINED3D_SM4_INSTRUCTION_MODIFIER)
+    {
+        DWORD modifier = *p++;
+        FIXME("Skipping modifier 0x%08x.\n", modifier);
+    }
+
+    if (opcode == WINED3D_SM4_OP_DCL_CONSTANT_BUFFER)
+    {
+        shader_sm4_read_src_param(priv, &p, WINED3D_DATA_FLOAT, &ins->declaration.src);
+        if (opcode_token & WINED3D_SM4_INDEX_TYPE_MASK)
+            ins->flags |= WINED3DSI_INDEXED_DYNAMIC;
+    }
+    else if (opcode == WINED3D_SM4_OP_DCL_OUTPUT_TOPOLOGY)
+    {
+        enum wined3d_sm4_output_primitive_type primitive_type;
+
+        primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
+        if (primitive_type >= sizeof(output_primitive_type_table) / sizeof(*output_primitive_type_table))
+        {
+            FIXME("Unhandled output primitive type %#x.\n", primitive_type);
+            ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
+        }
+        else
+        {
+            ins->declaration.primitive_type = output_primitive_type_table[primitive_type];
+        }
+    }
+    else if (opcode == WINED3D_SM4_OP_DCL_INPUT_PRIMITIVE)
+    {
+        enum wined3d_sm4_input_primitive_type primitive_type;
+
+        primitive_type = (opcode_token & WINED3D_SM4_PRIMITIVE_TYPE_MASK) >> WINED3D_SM4_PRIMITIVE_TYPE_SHIFT;
+        if (primitive_type >= sizeof(input_primitive_type_table) / sizeof(*input_primitive_type_table))
+        {
+            FIXME("Unhandled input primitive type %#x.\n", primitive_type);
+            ins->declaration.primitive_type = WINED3D_PT_UNDEFINED;
+        }
+        else
+        {
+            ins->declaration.primitive_type = input_primitive_type_table[primitive_type];
+        }
+    }
+    else if (opcode == WINED3D_SM4_OP_DCL_VERTICES_OUT)
+    {
+        ins->declaration.count = *p++;
+    }
+    else
+    {
+        for (i = 0; i < ins->dst_count; ++i)
+        {
+            if (!(shader_sm4_read_dst_param(priv, &p, map_data_type(opcode_info->dst_info[i]), &priv->dst_param[i])))
+            {
+                ins->handler_idx = WINED3DSIH_TABLE_SIZE;
+                return;
+            }
+        }
+
+        for (i = 0; i < ins->src_count; ++i)
+        {
+            if (!(shader_sm4_read_src_param(priv, &p, map_data_type(opcode_info->src_info[i]), &priv->src_param[i])))
+            {
+                ins->handler_idx = WINED3DSIH_TABLE_SIZE;
+                return;
+            }
+        }
+    }
 }
 
 static BOOL shader_sm4_is_end(void *data, const DWORD **ptr)
@@ -515,10 +801,6 @@ const struct wined3d_shader_frontend sm4_shader_frontend =
     shader_sm4_init,
     shader_sm4_free,
     shader_sm4_read_header,
-    shader_sm4_read_opcode,
-    shader_sm4_read_src_param,
-    shader_sm4_read_dst_param,
-    shader_sm4_read_semantic,
-    shader_sm4_read_comment,
+    shader_sm4_read_instruction,
     shader_sm4_is_end,
 };