-
Notifications
You must be signed in to change notification settings - Fork 4
/
xxGraphicD3DAsm.cpp
210 lines (209 loc) · 17.5 KB
/
xxGraphicD3DAsm.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
//==============================================================================
// xxGraphic : Direct3D Assembly Shader Source
//
// Copyright (c) 2019-2024 TAiGA
// https://github.com/metarutaiga/xxGraphic
//==============================================================================
#include "xxSystem.h"
#include "dxsdk/d3d9.h"
#include "dxsdk/d3d10TokenizedProgramFormat.hpp"
#include "internal/xxGraphicInternal.h"
#include "xxGraphicD3DAsm.h"
//==============================================================================
// Direct3D 8.0 Assembly Shader
//==============================================================================
#define D3DSP_WRITEMASK_ D3DSP_WRITEMASK_ALL
#define D3DSP_WRITEMASK_X D3DSP_WRITEMASK_0
#define D3DSP_WRITEMASK_XY D3DSP_WRITEMASK_X | D3DSP_WRITEMASK_1
#define D3DSP_WRITEMASK_XYZ D3DSP_WRITEMASK_XY | D3DSP_WRITEMASK_2
#define D3DSP_WRITEMASK_XYZW D3DSP_WRITEMASK_XYZW | D3DSP_WRITEMASK_3
#define D3DDECLUSAGE_UNKNOWN D3DSTT_UNKNOWN
#define D3DDECLUSAGE_2D D3DSTT_2D
#define D3DDECLUSAGE_CUBE D3DSTT_CUBE
#define D3DDECLUSAGE_VOLUME D3DSTT_VOLUME
#define D3DVS_X_ D3DVS_X_X
#define D3DVS_Y_ D3DVS_Y_Y
#define D3DVS_Z_ D3DVS_Z_Z
#define D3DVS_W_ D3DVS_W_W
#define D3DSIO(sio, length) (D3DSIO_ ## sio | (length << D3DSI_INSTLENGTH_SHIFT))
#define _TOKEN(mask, value) ((value << D3DSP_ ## mask ## _SHIFT)) | 0x80000000
#define _TOKEN1(mask, value) ((value << D3DSP_ ## mask ## _SHIFT) & D3DSP_ ## mask ## _MASK) | 0x80000000
#define _TOKEN2(mask, value) ((value << D3DSP_ ## mask ## _SHIFT2) & D3DSP_ ## mask ## _MASK2) | _TOKEN1(mask, value)
#define _DCL(dcl) _TOKEN(DCL_USAGE, D3DDECLUSAGE_ ## dcl)
#define _SRC(reg, index, ...) _TOKEN2(REGTYPE, D3DSPR_ ## reg) | D3DVS_W_ ## __VA_ARGS__ \
| D3DVS_Z_ ## __VA_ARGS__ \
| D3DVS_Y_ ## __VA_ARGS__ \
| D3DVS_X_ ## __VA_ARGS__ | index
#define _DST(reg, index, ...) _TOKEN2(REGTYPE, D3DSPR_ ## reg) | D3DSP_WRITEMASK_ ## __VA_ARGS__ | index
//------------------------------------------------------------------------------
const DWORD vertexShaderCode10[] =
{
D3DVS_VERSION(1, 0), // vs_1_0
D3DSIO_MUL, _DST(TEMP, 0), _SRC(CONST, 0), _SRC(INPUT, 0, X), // mul r0, c0, v0.x
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 1), _SRC(INPUT, 0, Y), _SRC(TEMP, 0), // mad r0, c1, v0.y, r0
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 2), _SRC(INPUT, 0, Z), _SRC(TEMP, 0), // mad r0, c2, v0.z, r0
D3DSIO_ADD, _DST(TEMP, 0), _SRC(CONST, 3), _SRC(TEMP, 0), // add r0, c3, r0
D3DSIO_MUL, _DST(TEMP, 1), _SRC(CONST, 4), _SRC(TEMP, 0, X), // mul r1, c4, r0.x
D3DSIO_MAD, _DST(TEMP, 1), _SRC(CONST, 5), _SRC(TEMP, 0, Y), _SRC(TEMP, 1), // mad r1, c5, r0.y, r1
D3DSIO_MAD, _DST(TEMP, 1), _SRC(CONST, 6), _SRC(TEMP, 0, Z), _SRC(TEMP, 1), // mad r1, c6, r0.z, r1
D3DSIO_MAD, _DST(TEMP, 1), _SRC(CONST, 7), _SRC(TEMP, 0, W), _SRC(TEMP, 1), // mad r1, c7, r0.w, r1
D3DSIO_MUL, _DST(TEMP, 0), _SRC(CONST, 8), _SRC(TEMP, 1, X), // mul r0, c8, r1.x
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 9), _SRC(TEMP, 1, Y), _SRC(TEMP, 0), // mad r0, c9, r1.y, r0
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 10), _SRC(TEMP, 1, Z), _SRC(TEMP, 0), // mad r0, c10, r1.z, r0
D3DSIO_MAD, _DST(RASTOUT, 0), _SRC(CONST, 11), _SRC(TEMP, 1, W), _SRC(TEMP, 0), // mad oPos, c11, r1.w, r0
D3DSIO_MOV, _DST(ATTROUT, 0), _SRC(INPUT, 5), // mov oD0, v5
D3DSIO_MOV, _DST(TEXCRDOUT, 0, XY), _SRC(INPUT, 7), // mov oT0.xy, v7
D3DSIO_END
};
//------------------------------------------------------------------------------
const DWORD vertexShaderCode11[] =
{
D3DVS_VERSION(1, 1), // vs_1_1
D3DSIO_DCL, _DCL(POSITION), _DST(INPUT, 0), // dcl_position v0
D3DSIO_DCL, _DCL(COLOR), _DST(INPUT, 1), // dcl_color v1
D3DSIO_DCL, _DCL(TEXCOORD), _DST(INPUT, 2), // dcl_texcoord v2
D3DSIO_MUL, _DST(TEMP, 0), _SRC(CONST, 0), _SRC(INPUT, 0, X), // mul r0, c0, v0.x
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 1), _SRC(INPUT, 0, Y), _SRC(TEMP, 0), // mad r0, c1, v0.y, r0
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 2), _SRC(INPUT, 0, Z), _SRC(TEMP, 0), // mad r0, c2, v0.z, r0
D3DSIO_ADD, _DST(TEMP, 0), _SRC(CONST, 3), _SRC(TEMP, 0), // add r0, c3, r0
D3DSIO_MUL, _DST(TEMP, 1), _SRC(CONST, 4), _SRC(TEMP, 0, X), // mul r1, c4, r0.x
D3DSIO_MAD, _DST(TEMP, 1), _SRC(CONST, 5), _SRC(TEMP, 0, Y), _SRC(TEMP, 1), // mad r1, c5, r0.y, r1
D3DSIO_MAD, _DST(TEMP, 1), _SRC(CONST, 6), _SRC(TEMP, 0, Z), _SRC(TEMP, 1), // mad r1, c6, r0.z, r1
D3DSIO_MAD, _DST(TEMP, 1), _SRC(CONST, 7), _SRC(TEMP, 0, W), _SRC(TEMP, 1), // mad r1, c7, r0.w, r1
D3DSIO_MUL, _DST(TEMP, 0), _SRC(CONST, 8), _SRC(TEMP, 1, X), // mul r0, c8, r1.x
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 9), _SRC(TEMP, 1, Y), _SRC(TEMP, 0), // mad r0, c9, r1.y, r0
D3DSIO_MAD, _DST(TEMP, 0), _SRC(CONST, 10), _SRC(TEMP, 1, Z), _SRC(TEMP, 0), // mad r0, c10, r1.z, r0
D3DSIO_MAD, _DST(RASTOUT, 0), _SRC(CONST, 11), _SRC(TEMP, 1, W), _SRC(TEMP, 0), // mad oPos, c11, r1.w, r0
D3DSIO_MOV, _DST(ATTROUT, 0), _SRC(INPUT, 1), // mov oD0, v1
D3DSIO_MOV, _DST(TEXCRDOUT, 0, XY), _SRC(INPUT, 2), // mov oT0.xy, v2
D3DSIO_END
};
//------------------------------------------------------------------------------
const DWORD pixelShaderCode10[] =
{
D3DPS_VERSION(1, 0), // ps_1_0
D3DSIO_TEX, _DST(TEXTURE, 0), // tex t0
D3DSIO_MUL, _DST(TEMP, 0), _SRC(TEXTURE, 0), _SRC(INPUT, 0), // mul r0, t0, v0
D3DSIO_END
};
//------------------------------------------------------------------------------
const DWORD pixelShaderCode20[] =
{
D3DPS_VERSION(2, 0), // ps_2_0
D3DSIO(DCL, 2), _DCL(UNKNOWN), _DST(INPUT, 0), // dcl v0
D3DSIO(DCL, 2), _DCL(UNKNOWN), _DST(TEXTURE, 0), // dcl t0.xy
D3DSIO(DCL, 2), _DCL(2D), _DST(SAMPLER, 0), // dcl_2d s0
D3DSIO(TEX, 3), _DST(TEMP, 0), _SRC(TEXTURE, 0), _SRC(SAMPLER, 0), // texld r0, t0, s0
D3DSIO(MUL, 3), _DST(TEMP, 0), _SRC(TEMP, 0), _SRC(INPUT, 0), // mul r0, r0, v0
D3DSIO(MOV, 2), _DST(COLOROUT, 0), _SRC(TEMP, 0), // mov oC0, r0
D3DSIO(END, 0)
};
//==============================================================================
// Direct3D 10.0 Assembly Shader
//==============================================================================
#define _POSITION 0x49534f50, 0x4e4f4954
#define _COLOR 0x4f4c4f43, 0x00000052
#define _TEXCOORD 0x43584554, 0x44524f4f
#define _SV_POSITION 0x505f5653, 0x5449534f, 0x004e4f49
#define _SV_TARGET 0x545f5653, 0x45475241, 0x00000054
#define D3D10_SB_4_COMPONENT_ D3D10_SB_4_COMPONENT_XYZW
#define D3D10_SB_4_COMPONENT_XXXX ((D3D10_SB_4_COMPONENT_X << 0) | (D3D10_SB_4_COMPONENT_X << 2) | (D3D10_SB_4_COMPONENT_X << 4) | (D3D10_SB_4_COMPONENT_X << 6))
#define D3D10_SB_4_COMPONENT_XYXX ((D3D10_SB_4_COMPONENT_X << 0) | (D3D10_SB_4_COMPONENT_Y << 2) | (D3D10_SB_4_COMPONENT_X << 4) | (D3D10_SB_4_COMPONENT_X << 6))
#define D3D10_SB_4_COMPONENT_XYZW ((D3D10_SB_4_COMPONENT_X << 0) | (D3D10_SB_4_COMPONENT_Y << 2) | (D3D10_SB_4_COMPONENT_Z << 4) | (D3D10_SB_4_COMPONENT_W << 6))
#define D3D10_SB_4_COMPONENT_YYYY ((D3D10_SB_4_COMPONENT_Y << 0) | (D3D10_SB_4_COMPONENT_Y << 2) | (D3D10_SB_4_COMPONENT_Y << 4) | (D3D10_SB_4_COMPONENT_Y << 6))
#define D3D10_SB_4_COMPONENT_ZZZZ ((D3D10_SB_4_COMPONENT_Z << 0) | (D3D10_SB_4_COMPONENT_Z << 2) | (D3D10_SB_4_COMPONENT_Z << 4) | (D3D10_SB_4_COMPONENT_Z << 6))
#define D3D10_SB_4_COMPONENT_WWWW ((D3D10_SB_4_COMPONENT_W << 0) | (D3D10_SB_4_COMPONENT_W << 2) | (D3D10_SB_4_COMPONENT_W << 4) | (D3D10_SB_4_COMPONENT_W << 6))
#define D3D10_SB_OPERAND_4_COMPONENT_MASK_ D3D10_SB_OPERAND_4_COMPONENT_MASK_XYZW
#define D3D10_SB_OPERAND_4_COMPONENT_MASK_XY (D3D10_SB_OPERAND_4_COMPONENT_MASK_X | D3D10_SB_OPERAND_4_COMPONENT_MASK_Y)
#define D3D10_SB_OPERAND_4_COMPONENT_MASK_XYZ (D3D10_SB_OPERAND_4_COMPONENT_MASK_XY | D3D10_SB_OPERAND_4_COMPONENT_MASK_Z)
#define D3D10_SB_OPERAND_4_COMPONENT_MASK_XYZW (D3D10_SB_OPERAND_4_COMPONENT_MASK_XYZ | D3D10_SB_OPERAND_4_COMPONENT_MASK_W)
#define D3D10_SB_RETURN_TYPE_FLOAT4 ((D3D10_SB_RETURN_TYPE_FLOAT << 0) | (D3D10_SB_RETURN_TYPE_FLOAT << 4) | (D3D10_SB_RETURN_TYPE_FLOAT << 8) | (D3D10_SB_RETURN_TYPE_FLOAT << 12))
#define _OP(opcode, length) (D3D10_SB_OPCODE_ ## opcode | ENCODE_D3D10_SB_TOKENIZED_INSTRUCTION_LENGTH(length))
#define _OP_DIMENSION(opcode, length, dim) (_OP(opcode, length) | ENCODE_D3D10_SB_RESOURCE_DIMENSION(D3D10_SB_RESOURCE_DIMENSION_ ## dim))
#define _OP_INTERPOLATION(opcode, length, int) (_OP(opcode, length) | ENCODE_D3D10_SB_INPUT_INTERPOLATION_MODE(D3D10_SB_INTERPOLATION_ ## int))
#define _0(index, reg) ENCODE_D3D10_SB_OPERAND_NUM_COMPONENTS(D3D10_SB_OPERAND_0_COMPONENT) | \
ENCODE_D3D10_SB_OPERAND_INDEX_DIMENSION(D3D10_SB_OPERAND_INDEX_ ## index) | \
ENCODE_D3D10_SB_OPERAND_TYPE(D3D10_SB_OPERAND_TYPE_ ## reg)
#define _4M(index, reg, ...) ENCODE_D3D10_SB_OPERAND_NUM_COMPONENTS(D3D10_SB_OPERAND_4_COMPONENT) | \
ENCODE_D3D10_SB_OPERAND_4_COMPONENT_SELECTION_MODE(D3D10_SB_OPERAND_4_COMPONENT_MASK_MODE) | \
ENCODE_D3D10_SB_OPERAND_INDEX_DIMENSION(D3D10_SB_OPERAND_INDEX_ ## index) | \
ENCODE_D3D10_SB_OPERAND_TYPE(D3D10_SB_OPERAND_TYPE_ ## reg) | \
(D3D10_SB_OPERAND_4_COMPONENT_MASK_ ## __VA_ARGS__)
#define _4S(index, reg, ...) ENCODE_D3D10_SB_OPERAND_NUM_COMPONENTS(D3D10_SB_OPERAND_4_COMPONENT) | \
ENCODE_D3D10_SB_OPERAND_4_COMPONENT_SELECTION_MODE(D3D10_SB_OPERAND_4_COMPONENT_SWIZZLE_MODE) | \
ENCODE_D3D10_SB_OPERAND_INDEX_DIMENSION(D3D10_SB_OPERAND_INDEX_ ## index) | \
ENCODE_D3D10_SB_OPERAND_TYPE(D3D10_SB_OPERAND_TYPE_ ## reg) | \
(D3D10_SB_4_COMPONENT_ ## __VA_ARGS__ << D3D10_SB_OPERAND_4_COMPONENT_SWIZZLE_SHIFT)
//------------------------------------------------------------------------------
const DWORD vertexShaderCode40[] =
{
"DXBC"_cc, 0x594d7a0d, 0x1efb9a50, 0x00b96a57, 0xf05960a9,
0x00000001, 0x00000388, 3,
0x0000002c, 0x000000a8, 0x00000128,
"ISGN"_cc, 0x00000074, 3, 0x00000008,
0x00000050, 0, 0, 3, 0, 0x0707,
0x0000005c, 0, 0, 3, 1, 0x0f0f,
0x00000068, 0, 0, 3, 2, 0x0303,
_POSITION, 0,
_COLOR, 0,
_TEXCOORD, 0,
"OSGN"_cc, 0x00000078, 3, 0x00000008,
0x00000050, 0, 1, 3, 0, 0x000f,
0x00000060, 0, 0, 3, 1, 0x000f,
0x0000006c, 0, 0, 3, 2, 0x0c03,
_SV_POSITION, 0,
_COLOR, 0,
_TEXCOORD, 0,
"SHDR"_cc, 0x00000258, ENCODE_D3D10_SB_TOKENIZED_PROGRAM_VERSION_TOKEN(D3D10_SB_VERTEX_SHADER, 4, 0), 0x00000096,
_OP(DCL_CONSTANT_BUFFER, 4), _4S(2D, CONSTANT_BUFFER), D3D10_SB_CONSTANT_BUFFER_IMMEDIATE_INDEXED, 12, // dcl_constantbuffer CB0[12], immediateIndexed
_OP(DCL_INPUT, 3), _4M(1D, INPUT, XYZ), 0, // dcl_input v0.xyz
_OP(DCL_INPUT, 3), _4M(1D, INPUT), 1, // dcl_input v1.xyzw
_OP(DCL_INPUT, 3), _4M(1D, INPUT, XY), 2, // dcl_input v2.xy
_OP(DCL_OUTPUT_SIV, 4), _4M(1D, OUTPUT), 0, 1, // dcl_output_siv o0.xyzw
_OP(DCL_OUTPUT, 3), _4M(1D, OUTPUT), 1, // dcl_output o1.xyzw
_OP(DCL_OUTPUT, 3), _4M(1D, OUTPUT, XY), 2, // dcl_output o2.xy
_OP(DCL_TEMPS, 2), 2, // dcl_temps 2
_OP(MUL, 8), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 0, _4S(1D, INPUT, XXXX), 0, // mul r0.xyzw, cb0[0].xyzw, v0.xxxx
_OP(MAD, 10), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 1, _4S(1D, INPUT, YYYY), 0, _4S(1D, TEMP), 0, // mad r0.xyzw, cb0[1].xyzw, v0.yyyy, r0.xyzw
_OP(MAD, 10), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 2, _4S(1D, INPUT, ZZZZ), 0, _4S(1D, TEMP), 0, // mad r0.xyzw, cb0[2].xyzw, v0.zzzz, r0.xyzw
_OP(ADD, 8), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 3, _4S(1D, TEMP), 0, // add r0.xyzw, cb0[3].xyzw, r0.xyzw
_OP(MUL, 8), _4M(1D, TEMP), 1, _4S(2D, CONSTANT_BUFFER), 0, 4, _4S(1D, TEMP, XXXX), 0, // mul r1.xyzw, cb0[4].xyzw, r0.xxxx
_OP(MAD, 10), _4M(1D, TEMP), 1, _4S(2D, CONSTANT_BUFFER), 0, 5, _4S(1D, TEMP, YYYY), 0, _4S(1D, TEMP), 1, // mad r1.xyzw, cb0[5].xyzw, r0.yyyy, r1.xyzw
_OP(MAD, 10), _4M(1D, TEMP), 1, _4S(2D, CONSTANT_BUFFER), 0, 6, _4S(1D, TEMP, ZZZZ), 0, _4S(1D, TEMP), 1, // mad r1.xyzw, cb0[6].xyzw, r0.zzzz, r1.xyzw
_OP(MAD, 10), _4M(1D, TEMP), 1, _4S(2D, CONSTANT_BUFFER), 0, 7, _4S(1D, TEMP, WWWW), 0, _4S(1D, TEMP), 1, // mad r1.xyzw, cb0[7].xyzw, r0.zzzz, r1.xyzw
_OP(MUL, 8), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 8, _4S(1D, TEMP, XXXX), 1, // mul r0.xyzw, cb0[8].xyzw, r1.xxxx
_OP(MAD, 10), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 9, _4S(1D, TEMP, YYYY), 1, _4S(1D, TEMP), 0, // mad r0.xyzw, cb0[9].xyzw, r1.yyyy, r0.xyzw
_OP(MAD, 10), _4M(1D, TEMP), 0, _4S(2D, CONSTANT_BUFFER), 0, 10, _4S(1D, TEMP, ZZZZ), 1, _4S(1D, TEMP), 0, // mad r0.xyzw, cb0[10].xyzw, r1.zzzz, r0.xyzw
_OP(MAD, 10), _4M(1D, OUTPUT), 0, _4S(2D, CONSTANT_BUFFER), 0, 11, _4S(1D, TEMP, WWWW), 1, _4S(1D, TEMP), 0, // mad o0.xyzw, cb0[11].xyzw, r1.zzzz, r0.xyzw
_OP(MOV, 5), _4M(1D, OUTPUT), 1, _4S(1D, INPUT), 1, // mov o1.xyzw, v1.xyzw
_OP(MOV, 5), _4M(1D, OUTPUT, XY), 2, _4S(1D, INPUT, XYXX), 2, // mov o2.xy, v2.xyxx
_OP(RET, 1) // ret
};
//------------------------------------------------------------------------------
const DWORD pixelShaderCode40[] =
{
"DXBC"_cc, 0x699f5ee8, 0xcbd8a667, 0xedaa31ef, 0x41715e6e,
0x00000001, 0x00000180, 3,
0x0000002c, 0x000000ac, 0x000000e4,
"ISGN"_cc, 0x00000078, 3, 0x00000008,
0x00000050, 0, 1, 3, 0, 0x000f,
0x00000060, 0, 0, 3, 1, 0x0f0f,
0x0000006c, 0, 0, 3, 2, 0x0303,
_SV_POSITION, 0,
_COLOR, 0,
_TEXCOORD, 0,
"OSGN"_cc, 0x00000030, 1, 0x00000008,
0x00000020, 0, 0, 3, 0, 0x000f,
_SV_TARGET, 0,
"SHDR"_cc, 0x00000094, ENCODE_D3D10_SB_TOKENIZED_PROGRAM_VERSION_TOKEN(D3D10_SB_PIXEL_SHADER, 4, 0), 0x00000025,
_OP(DCL_SAMPLER, 3), _0(1D, SAMPLER), D3D10_SB_SAMPLER_MODE_DEFAULT, // dcl_sampler s0, mode_default
_OP_DIMENSION(DCL_RESOURCE, 4, TEXTURE2D), _0(1D, RESOURCE), 0, D3D10_SB_RETURN_TYPE_FLOAT4, // dcl_resource_texture2d(float,float,float,float) t0
_OP_INTERPOLATION(DCL_INPUT_PS, 3, LINEAR), _4M(1D, INPUT), 1, // dcl_input_ps linear v1.xyzw
_OP_INTERPOLATION(DCL_INPUT_PS, 3, LINEAR), _4M(1D, INPUT, XY), 2, // dcl_input_ps linear v2.xy
_OP(DCL_OUTPUT, 3), _4M(1D, OUTPUT), 0, // dcl_output o0.xyzw
_OP(DCL_TEMPS, 2), 1, // dcl_temps 1
_OP(SAMPLE, 9), _4M(1D, TEMP), 0, _4S(1D, INPUT, XYXX), 2, _4S(1D, RESOURCE), 0, _0(1D, SAMPLER), 0, // sample r0.xyzw, v2.xyxx, t0.xyzw, s0
_OP(MUL, 7), _4M(1D, OUTPUT), 0, _4S(1D, TEMP), 0, _4S(1D, INPUT), 1, // mul o0.xyzw, r0.xyzw, v1.xyzw
_OP(RET, 1) // ret
};
//------------------------------------------------------------------------------