2 * Direct3D bytecode output functions
4 * Copyright 2008 Stefan Dösinger
5 * Copyright 2009 Matteo Bruni
7 * This library is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * This library is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with this library; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
24 #include "wine/port.h"
25 #include "wine/debug.h"
27 #include "d3d9types.h"
28 #include "d3dcompiler_private.h"
30 WINE_DEFAULT_DEBUG_CHANNEL(bytecodewriter
);
32 /****************************************************************
33 * General assembler shader construction helper routines follow *
34 ****************************************************************/
35 /* struct instruction *alloc_instr
37 * Allocates a new instruction structure with srcs registers
40 * srcs: Number of source registers to allocate
43 * A pointer to the allocated instruction structure
44 * NULL in case of an allocation failure
46 struct instruction
*alloc_instr(unsigned int srcs
) {
47 struct instruction
*ret
= d3dcompiler_alloc(sizeof(*ret
));
49 ERR("Failed to allocate memory for an instruction structure\n");
54 ret
->src
= d3dcompiler_alloc(srcs
* sizeof(*ret
->src
));
56 ERR("Failed to allocate memory for instruction registers\n");
57 d3dcompiler_free(ret
);
65 /* void add_instruction
67 * Adds a new instruction to the shader's instructions array and grows the instruction array
70 * The function does NOT copy the instruction structure. Make sure not to release the
71 * instruction or any of its substructures like registers.
74 * shader: Shader to add the instruction to
75 * instr: Instruction to add to the shader
77 BOOL
add_instruction(struct bwriter_shader
*shader
, struct instruction
*instr
) {
78 struct instruction
**new_instructions
;
80 if(!shader
) return FALSE
;
82 if(shader
->instr_alloc_size
== 0) {
83 shader
->instr
= d3dcompiler_alloc(sizeof(*shader
->instr
) * INSTRARRAY_INITIAL_SIZE
);
85 ERR("Failed to allocate the shader instruction array\n");
88 shader
->instr_alloc_size
= INSTRARRAY_INITIAL_SIZE
;
89 } else if(shader
->instr_alloc_size
== shader
->num_instrs
) {
90 new_instructions
= d3dcompiler_realloc(shader
->instr
,
91 sizeof(*shader
->instr
) * (shader
->instr_alloc_size
) * 2);
92 if(!new_instructions
) {
93 ERR("Failed to grow the shader instruction array\n");
96 shader
->instr
= new_instructions
;
97 shader
->instr_alloc_size
= shader
->instr_alloc_size
* 2;
98 } else if(shader
->num_instrs
> shader
->instr_alloc_size
) {
99 ERR("More instructions than allocated. This should not happen\n");
103 shader
->instr
[shader
->num_instrs
] = instr
;
104 shader
->num_instrs
++;
108 BOOL
add_constF(struct bwriter_shader
*shader
, DWORD reg
, float x
, float y
, float z
, float w
) {
109 struct constant
*newconst
;
112 struct constant
**newarray
;
113 newarray
= d3dcompiler_realloc(shader
->constF
,
114 sizeof(*shader
->constF
) * (shader
->num_cf
+ 1));
116 ERR("Failed to grow the constants array\n");
119 shader
->constF
= newarray
;
121 shader
->constF
= d3dcompiler_alloc(sizeof(*shader
->constF
));
122 if(!shader
->constF
) {
123 ERR("Failed to allocate the constants array\n");
128 newconst
= d3dcompiler_alloc(sizeof(*newconst
));
130 ERR("Failed to allocate a new constant\n");
133 newconst
->regnum
= reg
;
134 newconst
->value
[0].f
= x
;
135 newconst
->value
[1].f
= y
;
136 newconst
->value
[2].f
= z
;
137 newconst
->value
[3].f
= w
;
138 shader
->constF
[shader
->num_cf
] = newconst
;
144 BOOL
add_constI(struct bwriter_shader
*shader
, DWORD reg
, INT x
, INT y
, INT z
, INT w
) {
145 struct constant
*newconst
;
148 struct constant
**newarray
;
149 newarray
= d3dcompiler_realloc(shader
->constI
,
150 sizeof(*shader
->constI
) * (shader
->num_ci
+ 1));
152 ERR("Failed to grow the constants array\n");
155 shader
->constI
= newarray
;
157 shader
->constI
= d3dcompiler_alloc(sizeof(*shader
->constI
));
158 if(!shader
->constI
) {
159 ERR("Failed to allocate the constants array\n");
164 newconst
= d3dcompiler_alloc(sizeof(*newconst
));
166 ERR("Failed to allocate a new constant\n");
169 newconst
->regnum
= reg
;
170 newconst
->value
[0].i
= x
;
171 newconst
->value
[1].i
= y
;
172 newconst
->value
[2].i
= z
;
173 newconst
->value
[3].i
= w
;
174 shader
->constI
[shader
->num_ci
] = newconst
;
180 BOOL
add_constB(struct bwriter_shader
*shader
, DWORD reg
, BOOL x
) {
181 struct constant
*newconst
;
184 struct constant
**newarray
;
185 newarray
= d3dcompiler_realloc(shader
->constB
,
186 sizeof(*shader
->constB
) * (shader
->num_cb
+ 1));
188 ERR("Failed to grow the constants array\n");
191 shader
->constB
= newarray
;
193 shader
->constB
= d3dcompiler_alloc(sizeof(*shader
->constB
));
194 if(!shader
->constB
) {
195 ERR("Failed to allocate the constants array\n");
200 newconst
= d3dcompiler_alloc(sizeof(*newconst
));
202 ERR("Failed to allocate a new constant\n");
205 newconst
->regnum
= reg
;
206 newconst
->value
[0].b
= x
;
207 shader
->constB
[shader
->num_cb
] = newconst
;
213 BOOL
record_declaration(struct bwriter_shader
*shader
, DWORD usage
,
214 DWORD usage_idx
, DWORD mod
, BOOL output
,
215 DWORD regnum
, DWORD writemask
, BOOL builtin
) {
217 struct declaration
**decl
;
220 if(!shader
) return FALSE
;
223 num
= &shader
->num_outputs
;
224 decl
= &shader
->outputs
;
226 num
= &shader
->num_inputs
;
227 decl
= &shader
->inputs
;
231 *decl
= d3dcompiler_alloc(sizeof(**decl
));
233 ERR("Error allocating declarations array\n");
237 struct declaration
*newdecl
;
238 for(i
= 0; i
< *num
; i
++) {
239 if((*decl
)[i
].regnum
== regnum
&& ((*decl
)[i
].writemask
& writemask
)) {
240 WARN("Declaration of register %u already exists, writemask match 0x%x\n",
241 regnum
, (*decl
)[i
].writemask
& writemask
);
245 newdecl
= d3dcompiler_realloc(*decl
,
246 sizeof(**decl
) * ((*num
) + 1));
248 ERR("Error reallocating declarations array\n");
253 (*decl
)[*num
].usage
= usage
;
254 (*decl
)[*num
].usage_idx
= usage_idx
;
255 (*decl
)[*num
].regnum
= regnum
;
256 (*decl
)[*num
].mod
= mod
;
257 (*decl
)[*num
].writemask
= writemask
;
258 (*decl
)[*num
].builtin
= builtin
;
264 BOOL
record_sampler(struct bwriter_shader
*shader
, DWORD samptype
, DWORD mod
, DWORD regnum
) {
267 if(!shader
) return FALSE
;
269 if(shader
->num_samplers
== 0) {
270 shader
->samplers
= d3dcompiler_alloc(sizeof(*shader
->samplers
));
271 if(!shader
->samplers
) {
272 ERR("Error allocating samplers array\n");
276 struct samplerdecl
*newarray
;
278 for(i
= 0; i
< shader
->num_samplers
; i
++) {
279 if(shader
->samplers
[i
].regnum
== regnum
) {
280 WARN("Sampler %u already declared\n", regnum
);
281 /* This is not an error as far as the assembler is concerned.
282 * Direct3D might refuse to load the compiled shader though
287 newarray
= d3dcompiler_realloc(shader
->samplers
,
288 sizeof(*shader
->samplers
) * (shader
->num_samplers
+ 1));
290 ERR("Error reallocating samplers array\n");
293 shader
->samplers
= newarray
;
296 shader
->samplers
[shader
->num_samplers
].type
= samptype
;
297 shader
->samplers
[shader
->num_samplers
].mod
= mod
;
298 shader
->samplers
[shader
->num_samplers
].regnum
= regnum
;
299 shader
->num_samplers
++;
304 /* shader bytecode buffer manipulation functions.
305 * allocate_buffer creates a new buffer structure, put_dword adds a new
306 * DWORD to the buffer. In the rare case of a memory allocation failure
307 * when trying to grow the buffer a flag is set in the buffer to mark it
308 * invalid. This avoids return value checking and passing in many places
310 static struct bytecode_buffer
*allocate_buffer(void) {
311 struct bytecode_buffer
*ret
;
313 ret
= d3dcompiler_alloc(sizeof(*ret
));
314 if(!ret
) return NULL
;
316 ret
->alloc_size
= BYTECODEBUFFER_INITIAL_SIZE
;
317 ret
->data
= d3dcompiler_alloc(sizeof(DWORD
) * ret
->alloc_size
);
319 d3dcompiler_free(ret
);
326 static void put_dword(struct bytecode_buffer
*buffer
, DWORD value
) {
327 if(FAILED(buffer
->state
)) return;
329 if(buffer
->alloc_size
== buffer
->size
) {
331 buffer
->alloc_size
*= 2;
332 newarray
= d3dcompiler_realloc(buffer
->data
,
333 sizeof(DWORD
) * buffer
->alloc_size
);
335 ERR("Failed to grow the buffer data memory\n");
336 buffer
->state
= E_OUTOFMEMORY
;
339 buffer
->data
= newarray
;
341 buffer
->data
[buffer
->size
++] = value
;
344 /* bwriter -> d3d9 conversion functions. */
345 static DWORD
d3d9_swizzle(DWORD bwriter_swizzle
)
347 /* Currently a NOP, but this allows changing the internal definitions
348 * without side effects. */
351 if ((bwriter_swizzle
& BWRITERVS_X_X
) == BWRITERVS_X_X
) ret
|= D3DVS_X_X
;
352 if ((bwriter_swizzle
& BWRITERVS_X_Y
) == BWRITERVS_X_Y
) ret
|= D3DVS_X_Y
;
353 if ((bwriter_swizzle
& BWRITERVS_X_Z
) == BWRITERVS_X_Z
) ret
|= D3DVS_X_Z
;
354 if ((bwriter_swizzle
& BWRITERVS_X_W
) == BWRITERVS_X_W
) ret
|= D3DVS_X_W
;
356 if ((bwriter_swizzle
& BWRITERVS_Y_X
) == BWRITERVS_Y_X
) ret
|= D3DVS_Y_X
;
357 if ((bwriter_swizzle
& BWRITERVS_Y_Y
) == BWRITERVS_Y_Y
) ret
|= D3DVS_Y_Y
;
358 if ((bwriter_swizzle
& BWRITERVS_Y_Z
) == BWRITERVS_Y_Z
) ret
|= D3DVS_Y_Z
;
359 if ((bwriter_swizzle
& BWRITERVS_Y_W
) == BWRITERVS_Y_W
) ret
|= D3DVS_Y_W
;
361 if ((bwriter_swizzle
& BWRITERVS_Z_X
) == BWRITERVS_Z_X
) ret
|= D3DVS_Z_X
;
362 if ((bwriter_swizzle
& BWRITERVS_Z_Y
) == BWRITERVS_Z_Y
) ret
|= D3DVS_Z_Y
;
363 if ((bwriter_swizzle
& BWRITERVS_Z_Z
) == BWRITERVS_Z_Z
) ret
|= D3DVS_Z_Z
;
364 if ((bwriter_swizzle
& BWRITERVS_Z_W
) == BWRITERVS_Z_W
) ret
|= D3DVS_Z_W
;
366 if ((bwriter_swizzle
& BWRITERVS_W_X
) == BWRITERVS_W_X
) ret
|= D3DVS_W_X
;
367 if ((bwriter_swizzle
& BWRITERVS_W_Y
) == BWRITERVS_W_Y
) ret
|= D3DVS_W_Y
;
368 if ((bwriter_swizzle
& BWRITERVS_W_Z
) == BWRITERVS_W_Z
) ret
|= D3DVS_W_Z
;
369 if ((bwriter_swizzle
& BWRITERVS_W_W
) == BWRITERVS_W_W
) ret
|= D3DVS_W_W
;
374 static DWORD
d3d9_writemask(DWORD bwriter_writemask
)
378 if (bwriter_writemask
& BWRITERSP_WRITEMASK_0
) ret
|= D3DSP_WRITEMASK_0
;
379 if (bwriter_writemask
& BWRITERSP_WRITEMASK_1
) ret
|= D3DSP_WRITEMASK_1
;
380 if (bwriter_writemask
& BWRITERSP_WRITEMASK_2
) ret
|= D3DSP_WRITEMASK_2
;
381 if (bwriter_writemask
& BWRITERSP_WRITEMASK_3
) ret
|= D3DSP_WRITEMASK_3
;
386 static DWORD
d3d9_srcmod(DWORD bwriter_srcmod
)
388 switch (bwriter_srcmod
)
390 case BWRITERSPSM_NONE
: return D3DSPSM_NONE
;
391 case BWRITERSPSM_NEG
: return D3DSPSM_NEG
;
392 case BWRITERSPSM_BIAS
: return D3DSPSM_BIAS
;
393 case BWRITERSPSM_BIASNEG
: return D3DSPSM_BIASNEG
;
394 case BWRITERSPSM_SIGN
: return D3DSPSM_SIGN
;
395 case BWRITERSPSM_SIGNNEG
: return D3DSPSM_SIGNNEG
;
396 case BWRITERSPSM_COMP
: return D3DSPSM_COMP
;
397 case BWRITERSPSM_X2
: return D3DSPSM_X2
;
398 case BWRITERSPSM_X2NEG
: return D3DSPSM_X2NEG
;
399 case BWRITERSPSM_DZ
: return D3DSPSM_DZ
;
400 case BWRITERSPSM_DW
: return D3DSPSM_DW
;
401 case BWRITERSPSM_ABS
: return D3DSPSM_ABS
;
402 case BWRITERSPSM_ABSNEG
: return D3DSPSM_ABSNEG
;
403 case BWRITERSPSM_NOT
: return D3DSPSM_NOT
;
405 FIXME("Unhandled BWRITERSPSM token %#x.\n", bwriter_srcmod
);
410 static DWORD
d3d9_dstmod(DWORD bwriter_mod
)
414 if (bwriter_mod
& BWRITERSPDM_SATURATE
) ret
|= D3DSPDM_SATURATE
;
415 if (bwriter_mod
& BWRITERSPDM_PARTIALPRECISION
) ret
|= D3DSPDM_PARTIALPRECISION
;
416 if (bwriter_mod
& BWRITERSPDM_MSAMPCENTROID
) ret
|= D3DSPDM_MSAMPCENTROID
;
421 static DWORD
d3d9_comparetype(DWORD asmshader_comparetype
)
423 switch (asmshader_comparetype
)
425 case BWRITER_COMPARISON_GT
: return D3DSPC_GT
;
426 case BWRITER_COMPARISON_EQ
: return D3DSPC_EQ
;
427 case BWRITER_COMPARISON_GE
: return D3DSPC_GE
;
428 case BWRITER_COMPARISON_LT
: return D3DSPC_LT
;
429 case BWRITER_COMPARISON_NE
: return D3DSPC_NE
;
430 case BWRITER_COMPARISON_LE
: return D3DSPC_LE
;
432 FIXME("Unexpected BWRITER_COMPARISON type %#x.\n", asmshader_comparetype
);
437 static DWORD
d3d9_sampler(DWORD bwriter_sampler
)
439 if (bwriter_sampler
== BWRITERSTT_UNKNOWN
) return D3DSTT_UNKNOWN
;
440 if (bwriter_sampler
== BWRITERSTT_1D
) return D3DSTT_1D
;
441 if (bwriter_sampler
== BWRITERSTT_2D
) return D3DSTT_2D
;
442 if (bwriter_sampler
== BWRITERSTT_CUBE
) return D3DSTT_CUBE
;
443 if (bwriter_sampler
== BWRITERSTT_VOLUME
) return D3DSTT_VOLUME
;
444 FIXME("Unexpected BWRITERSAMPLER_TEXTURE_TYPE type %#x.\n", bwriter_sampler
);
449 static DWORD
d3d9_register(DWORD bwriter_register
)
451 if (bwriter_register
== BWRITERSPR_TEMP
) return D3DSPR_TEMP
;
452 if (bwriter_register
== BWRITERSPR_INPUT
) return D3DSPR_INPUT
;
453 if (bwriter_register
== BWRITERSPR_CONST
) return D3DSPR_CONST
;
454 if (bwriter_register
== BWRITERSPR_ADDR
) return D3DSPR_ADDR
;
455 if (bwriter_register
== BWRITERSPR_TEXTURE
) return D3DSPR_TEXTURE
;
456 if (bwriter_register
== BWRITERSPR_RASTOUT
) return D3DSPR_RASTOUT
;
457 if (bwriter_register
== BWRITERSPR_ATTROUT
) return D3DSPR_ATTROUT
;
458 if (bwriter_register
== BWRITERSPR_TEXCRDOUT
) return D3DSPR_TEXCRDOUT
;
459 if (bwriter_register
== BWRITERSPR_OUTPUT
) return D3DSPR_OUTPUT
;
460 if (bwriter_register
== BWRITERSPR_CONSTINT
) return D3DSPR_CONSTINT
;
461 if (bwriter_register
== BWRITERSPR_COLOROUT
) return D3DSPR_COLOROUT
;
462 if (bwriter_register
== BWRITERSPR_DEPTHOUT
) return D3DSPR_DEPTHOUT
;
463 if (bwriter_register
== BWRITERSPR_SAMPLER
) return D3DSPR_SAMPLER
;
464 if (bwriter_register
== BWRITERSPR_CONSTBOOL
) return D3DSPR_CONSTBOOL
;
465 if (bwriter_register
== BWRITERSPR_LOOP
) return D3DSPR_LOOP
;
466 if (bwriter_register
== BWRITERSPR_MISCTYPE
) return D3DSPR_MISCTYPE
;
467 if (bwriter_register
== BWRITERSPR_LABEL
) return D3DSPR_LABEL
;
468 if (bwriter_register
== BWRITERSPR_PREDICATE
) return D3DSPR_PREDICATE
;
470 FIXME("Unexpected BWRITERSPR %#x.\n", bwriter_register
);
474 static DWORD
d3d9_opcode(DWORD bwriter_opcode
)
476 switch (bwriter_opcode
)
478 case BWRITERSIO_NOP
: return D3DSIO_NOP
;
479 case BWRITERSIO_MOV
: return D3DSIO_MOV
;
480 case BWRITERSIO_ADD
: return D3DSIO_ADD
;
481 case BWRITERSIO_SUB
: return D3DSIO_SUB
;
482 case BWRITERSIO_MAD
: return D3DSIO_MAD
;
483 case BWRITERSIO_MUL
: return D3DSIO_MUL
;
484 case BWRITERSIO_RCP
: return D3DSIO_RCP
;
485 case BWRITERSIO_RSQ
: return D3DSIO_RSQ
;
486 case BWRITERSIO_DP3
: return D3DSIO_DP3
;
487 case BWRITERSIO_DP4
: return D3DSIO_DP4
;
488 case BWRITERSIO_MIN
: return D3DSIO_MIN
;
489 case BWRITERSIO_MAX
: return D3DSIO_MAX
;
490 case BWRITERSIO_SLT
: return D3DSIO_SLT
;
491 case BWRITERSIO_SGE
: return D3DSIO_SGE
;
492 case BWRITERSIO_EXP
: return D3DSIO_EXP
;
493 case BWRITERSIO_LOG
: return D3DSIO_LOG
;
494 case BWRITERSIO_LIT
: return D3DSIO_LIT
;
495 case BWRITERSIO_DST
: return D3DSIO_DST
;
496 case BWRITERSIO_LRP
: return D3DSIO_LRP
;
497 case BWRITERSIO_FRC
: return D3DSIO_FRC
;
498 case BWRITERSIO_M4x4
: return D3DSIO_M4x4
;
499 case BWRITERSIO_M4x3
: return D3DSIO_M4x3
;
500 case BWRITERSIO_M3x4
: return D3DSIO_M3x4
;
501 case BWRITERSIO_M3x3
: return D3DSIO_M3x3
;
502 case BWRITERSIO_M3x2
: return D3DSIO_M3x2
;
503 case BWRITERSIO_CALL
: return D3DSIO_CALL
;
504 case BWRITERSIO_CALLNZ
: return D3DSIO_CALLNZ
;
505 case BWRITERSIO_LOOP
: return D3DSIO_LOOP
;
506 case BWRITERSIO_RET
: return D3DSIO_RET
;
507 case BWRITERSIO_ENDLOOP
: return D3DSIO_ENDLOOP
;
508 case BWRITERSIO_LABEL
: return D3DSIO_LABEL
;
509 case BWRITERSIO_DCL
: return D3DSIO_DCL
;
510 case BWRITERSIO_POW
: return D3DSIO_POW
;
511 case BWRITERSIO_CRS
: return D3DSIO_CRS
;
512 case BWRITERSIO_SGN
: return D3DSIO_SGN
;
513 case BWRITERSIO_ABS
: return D3DSIO_ABS
;
514 case BWRITERSIO_NRM
: return D3DSIO_NRM
;
515 case BWRITERSIO_SINCOS
: return D3DSIO_SINCOS
;
516 case BWRITERSIO_REP
: return D3DSIO_REP
;
517 case BWRITERSIO_ENDREP
: return D3DSIO_ENDREP
;
518 case BWRITERSIO_IF
: return D3DSIO_IF
;
519 case BWRITERSIO_IFC
: return D3DSIO_IFC
;
520 case BWRITERSIO_ELSE
: return D3DSIO_ELSE
;
521 case BWRITERSIO_ENDIF
: return D3DSIO_ENDIF
;
522 case BWRITERSIO_BREAK
: return D3DSIO_BREAK
;
523 case BWRITERSIO_BREAKC
: return D3DSIO_BREAKC
;
524 case BWRITERSIO_MOVA
: return D3DSIO_MOVA
;
525 case BWRITERSIO_DEFB
: return D3DSIO_DEFB
;
526 case BWRITERSIO_DEFI
: return D3DSIO_DEFI
;
528 case BWRITERSIO_TEXCOORD
: return D3DSIO_TEXCOORD
;
529 case BWRITERSIO_TEXKILL
: return D3DSIO_TEXKILL
;
530 case BWRITERSIO_TEX
: return D3DSIO_TEX
;
531 case BWRITERSIO_TEXBEM
: return D3DSIO_TEXBEM
;
532 case BWRITERSIO_TEXBEML
: return D3DSIO_TEXBEML
;
533 case BWRITERSIO_TEXREG2AR
: return D3DSIO_TEXREG2AR
;
534 case BWRITERSIO_TEXREG2GB
: return D3DSIO_TEXREG2GB
;
535 case BWRITERSIO_TEXM3x2PAD
: return D3DSIO_TEXM3x2PAD
;
536 case BWRITERSIO_TEXM3x2TEX
: return D3DSIO_TEXM3x2TEX
;
537 case BWRITERSIO_TEXM3x3PAD
: return D3DSIO_TEXM3x3PAD
;
538 case BWRITERSIO_TEXM3x3TEX
: return D3DSIO_TEXM3x3TEX
;
539 case BWRITERSIO_TEXM3x3SPEC
: return D3DSIO_TEXM3x3SPEC
;
540 case BWRITERSIO_TEXM3x3VSPEC
:return D3DSIO_TEXM3x3VSPEC
;
541 case BWRITERSIO_EXPP
: return D3DSIO_EXPP
;
542 case BWRITERSIO_LOGP
: return D3DSIO_LOGP
;
543 case BWRITERSIO_CND
: return D3DSIO_CND
;
544 case BWRITERSIO_DEF
: return D3DSIO_DEF
;
545 case BWRITERSIO_TEXREG2RGB
: return D3DSIO_TEXREG2RGB
;
546 case BWRITERSIO_TEXDP3TEX
: return D3DSIO_TEXDP3TEX
;
547 case BWRITERSIO_TEXM3x2DEPTH
:return D3DSIO_TEXM3x2DEPTH
;
548 case BWRITERSIO_TEXDP3
: return D3DSIO_TEXDP3
;
549 case BWRITERSIO_TEXM3x3
: return D3DSIO_TEXM3x3
;
550 case BWRITERSIO_TEXDEPTH
: return D3DSIO_TEXDEPTH
;
551 case BWRITERSIO_CMP
: return D3DSIO_CMP
;
552 case BWRITERSIO_BEM
: return D3DSIO_BEM
;
553 case BWRITERSIO_DP2ADD
: return D3DSIO_DP2ADD
;
554 case BWRITERSIO_DSX
: return D3DSIO_DSX
;
555 case BWRITERSIO_DSY
: return D3DSIO_DSY
;
556 case BWRITERSIO_TEXLDD
: return D3DSIO_TEXLDD
;
557 case BWRITERSIO_SETP
: return D3DSIO_SETP
;
558 case BWRITERSIO_TEXLDL
: return D3DSIO_TEXLDL
;
559 case BWRITERSIO_BREAKP
: return D3DSIO_BREAKP
;
561 case BWRITERSIO_PHASE
: return D3DSIO_PHASE
;
562 case BWRITERSIO_COMMENT
: return D3DSIO_COMMENT
;
563 case BWRITERSIO_END
: return D3DSIO_END
;
565 case BWRITERSIO_TEXLDP
: return D3DSIO_TEX
| D3DSI_TEXLD_PROJECT
;
566 case BWRITERSIO_TEXLDB
: return D3DSIO_TEX
| D3DSI_TEXLD_BIAS
;
569 FIXME("Unhandled BWRITERSIO token %#x.\n", bwriter_opcode
);
574 /******************************************************
575 * Implementation of the writer functions starts here *
576 ******************************************************/
577 static void write_declarations(struct bc_writer
*This
,
578 struct bytecode_buffer
*buffer
, BOOL len
,
579 const struct declaration
*decls
, unsigned int num
, DWORD type
) {
581 DWORD instr_dcl
= D3DSIO_DCL
;
583 struct shader_reg reg
;
585 ZeroMemory(®
, sizeof(reg
));
588 instr_dcl
|= 2 << D3DSI_INSTLENGTH_SHIFT
;
591 for(i
= 0; i
< num
; i
++) {
592 if(decls
[i
].builtin
) continue;
594 /* Write the DCL instruction */
595 put_dword(buffer
, instr_dcl
);
597 /* Write the usage and index */
598 token
= (1 << 31); /* Bit 31 of non-instruction opcodes is 1 */
599 token
|= (decls
[i
].usage
<< D3DSP_DCL_USAGE_SHIFT
) & D3DSP_DCL_USAGE_MASK
;
600 token
|= (decls
[i
].usage_idx
<< D3DSP_DCL_USAGEINDEX_SHIFT
) & D3DSP_DCL_USAGEINDEX_MASK
;
601 put_dword(buffer
, token
);
603 /* Write the dest register */
605 reg
.regnum
= decls
[i
].regnum
;
606 reg
.u
.writemask
= decls
[i
].writemask
;
607 This
->funcs
->dstreg(This
, ®
, buffer
, 0, decls
[i
].mod
);
611 static void write_const(struct constant
**consts
, int num
, DWORD opcode
, DWORD reg_type
, struct bytecode_buffer
*buffer
, BOOL len
) {
613 DWORD instr_def
= opcode
;
614 const DWORD reg
= (1<<31) |
615 ((reg_type
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
) |
616 ((reg_type
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
) |
620 if(opcode
== D3DSIO_DEFB
)
621 instr_def
|= 2 << D3DSI_INSTLENGTH_SHIFT
;
623 instr_def
|= 5 << D3DSI_INSTLENGTH_SHIFT
;
626 for(i
= 0; i
< num
; i
++) {
627 /* Write the DEF instruction */
628 put_dword(buffer
, instr_def
);
630 put_dword(buffer
, reg
| (consts
[i
]->regnum
& D3DSP_REGNUM_MASK
));
631 put_dword(buffer
, consts
[i
]->value
[0].d
);
632 if(opcode
!= D3DSIO_DEFB
) {
633 put_dword(buffer
, consts
[i
]->value
[1].d
);
634 put_dword(buffer
, consts
[i
]->value
[2].d
);
635 put_dword(buffer
, consts
[i
]->value
[3].d
);
640 static void write_constF(const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
, BOOL len
) {
641 write_const(shader
->constF
, shader
->num_cf
, D3DSIO_DEF
, D3DSPR_CONST
, buffer
, len
);
644 /* This function looks for VS 1/2 registers mapping to VS 3 output registers */
645 static HRESULT
vs_find_builtin_varyings(struct bc_writer
*This
, const struct bwriter_shader
*shader
) {
647 DWORD usage
, usage_idx
, writemask
, regnum
;
649 for(i
= 0; i
< shader
->num_outputs
; i
++) {
650 if(!shader
->outputs
[i
].builtin
) continue;
652 usage
= shader
->outputs
[i
].usage
;
653 usage_idx
= shader
->outputs
[i
].usage_idx
;
654 writemask
= shader
->outputs
[i
].writemask
;
655 regnum
= shader
->outputs
[i
].regnum
;
658 case BWRITERDECLUSAGE_POSITION
:
659 case BWRITERDECLUSAGE_POSITIONT
:
661 WARN("dcl_position%u not supported in sm 1/2 shaders\n", usage_idx
);
664 TRACE("o%u is oPos\n", regnum
);
665 This
->oPos_regnum
= regnum
;
668 case BWRITERDECLUSAGE_COLOR
:
670 WARN("dcl_color%u not supported in sm 1/2 shaders\n", usage_idx
);
673 if(writemask
!= BWRITERSP_WRITEMASK_ALL
) {
674 WARN("Only WRITEMASK_ALL is supported on color in sm 1/2\n");
677 TRACE("o%u is oD%u\n", regnum
, usage_idx
);
678 This
->oD_regnum
[usage_idx
] = regnum
;
681 case BWRITERDECLUSAGE_TEXCOORD
:
683 WARN("dcl_color%u not supported in sm 1/2 shaders\n", usage_idx
);
686 if(writemask
!= (BWRITERSP_WRITEMASK_0
) &&
687 writemask
!= (BWRITERSP_WRITEMASK_0
| BWRITERSP_WRITEMASK_1
) &&
688 writemask
!= (BWRITERSP_WRITEMASK_0
| BWRITERSP_WRITEMASK_1
| BWRITERSP_WRITEMASK_2
) &&
689 writemask
!= (BWRITERSP_WRITEMASK_ALL
)) {
690 WARN("Partial writemasks not supported on texture coordinates in sm 1 and 2\n");
693 TRACE("o%u is oT%u\n", regnum
, usage_idx
);
694 This
->oT_regnum
[usage_idx
] = regnum
;
697 case BWRITERDECLUSAGE_PSIZE
:
699 WARN("dcl_psize%u not supported in sm 1/2 shaders\n", usage_idx
);
702 TRACE("o%u writemask 0x%08x is oPts\n", regnum
, writemask
);
703 This
->oPts_regnum
= regnum
;
704 This
->oPts_mask
= writemask
;
707 case BWRITERDECLUSAGE_FOG
:
709 WARN("dcl_fog%u not supported in sm 1 shaders\n", usage_idx
);
712 if(writemask
!= BWRITERSP_WRITEMASK_0
&& writemask
!= BWRITERSP_WRITEMASK_1
&&
713 writemask
!= BWRITERSP_WRITEMASK_2
&& writemask
!= BWRITERSP_WRITEMASK_3
) {
714 WARN("Unsupported fog writemask\n");
717 TRACE("o%u writemask 0x%08x is oFog\n", regnum
, writemask
);
718 This
->oFog_regnum
= regnum
;
719 This
->oFog_mask
= writemask
;
723 WARN("Varying type %u is not supported in shader model 1.x\n", usage
);
731 static void vs_1_x_header(struct bc_writer
*This
, const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
734 if(shader
->num_ci
|| shader
->num_cb
) {
735 WARN("Int and bool constants are not supported in shader model 1 shaders\n");
736 WARN("Got %u int and %u boolean constants\n", shader
->num_ci
, shader
->num_cb
);
737 This
->state
= E_INVALIDARG
;
741 hr
= vs_find_builtin_varyings(This
, shader
);
747 write_declarations(This
, buffer
, FALSE
, shader
->inputs
, shader
->num_inputs
, BWRITERSPR_INPUT
);
748 write_constF(shader
, buffer
, FALSE
);
751 static HRESULT
find_ps_builtin_semantics(struct bc_writer
*This
,
752 const struct bwriter_shader
*shader
,
755 DWORD usage
, usage_idx
, writemask
, regnum
;
757 This
->v_regnum
[0] = -1; This
->v_regnum
[1] = -1;
758 for(i
= 0; i
< 8; i
++) This
->t_regnum
[i
] = -1;
760 for(i
= 0; i
< shader
->num_inputs
; i
++) {
761 if(!shader
->inputs
[i
].builtin
) continue;
763 usage
= shader
->inputs
[i
].usage
;
764 usage_idx
= shader
->inputs
[i
].usage_idx
;
765 writemask
= shader
->inputs
[i
].writemask
;
766 regnum
= shader
->inputs
[i
].regnum
;
769 case BWRITERDECLUSAGE_COLOR
:
771 WARN("dcl_color%u not supported in sm 1 shaders\n", usage_idx
);
774 if(writemask
!= BWRITERSP_WRITEMASK_ALL
) {
775 WARN("Only WRITEMASK_ALL is supported on color in sm 1\n");
778 TRACE("v%u is v%u\n", regnum
, usage_idx
);
779 This
->v_regnum
[usage_idx
] = regnum
;
782 case BWRITERDECLUSAGE_TEXCOORD
:
783 if(usage_idx
> texcoords
) {
784 WARN("dcl_texcoord%u not supported in this shader version\n", usage_idx
);
787 if(writemask
!= (BWRITERSP_WRITEMASK_0
) &&
788 writemask
!= (BWRITERSP_WRITEMASK_0
| BWRITERSP_WRITEMASK_1
) &&
789 writemask
!= (BWRITERSP_WRITEMASK_0
| BWRITERSP_WRITEMASK_1
| BWRITERSP_WRITEMASK_2
) &&
790 writemask
!= (BWRITERSP_WRITEMASK_ALL
)) {
791 WARN("Partial writemasks not supported on texture coordinates in sm 1 and 2\n");
793 writemask
= BWRITERSP_WRITEMASK_ALL
;
795 TRACE("v%u is t%u\n", regnum
, usage_idx
);
796 This
->t_regnum
[usage_idx
] = regnum
;
800 WARN("Varying type %u is not supported in shader model 1.x\n", usage
);
808 static void ps_1_x_header(struct bc_writer
*This
, const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
811 /* First check the constants and varyings, and complain if unsupported things are used */
812 if(shader
->num_ci
|| shader
->num_cb
) {
813 WARN("Int and bool constants are not supported in shader model 1 shaders\n");
814 WARN("Got %u int and %u boolean constants\n", shader
->num_ci
, shader
->num_cb
);
815 This
->state
= E_INVALIDARG
;
819 hr
= find_ps_builtin_semantics(This
, shader
, 4);
825 write_constF(shader
, buffer
, FALSE
);
828 static void ps_1_4_header(struct bc_writer
*This
, const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
831 /* First check the constants and varyings, and complain if unsupported things are used */
832 if(shader
->num_ci
|| shader
->num_cb
) {
833 WARN("Int and bool constants are not supported in shader model 1 shaders\n");
834 WARN("Got %u int and %u boolean constants\n", shader
->num_ci
, shader
->num_cb
);
835 This
->state
= E_INVALIDARG
;
838 hr
= find_ps_builtin_semantics(This
, shader
, 6);
844 write_constF(shader
, buffer
, FALSE
);
847 static void end(struct bc_writer
*This
, const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
848 put_dword(buffer
, D3DSIO_END
);
851 static DWORD
map_vs_output(struct bc_writer
*This
, DWORD regnum
, DWORD mask
, DWORD
*has_components
) {
855 *has_components
= TRUE
;
856 if(regnum
== This
->oPos_regnum
) {
857 token
|= (D3DSPR_RASTOUT
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
858 token
|= D3DSRO_POSITION
& D3DSP_REGNUM_MASK
; /* No shift */
861 if(regnum
== This
->oFog_regnum
&& mask
== This
->oFog_mask
) {
862 token
|= (D3DSPR_RASTOUT
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
863 token
|= D3DSRO_FOG
& D3DSP_REGNUM_MASK
; /* No shift */
864 token
|= D3DSP_WRITEMASK_ALL
;
865 *has_components
= FALSE
;
868 if(regnum
== This
->oPts_regnum
&& mask
== This
->oPts_mask
) {
869 token
|= (D3DSPR_RASTOUT
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
870 token
|= D3DSRO_POINT_SIZE
& D3DSP_REGNUM_MASK
; /* No shift */
871 token
|= D3DSP_WRITEMASK_ALL
;
872 *has_components
= FALSE
;
875 for(i
= 0; i
< 2; i
++) {
876 if(regnum
== This
->oD_regnum
[i
]) {
877 token
|= (D3DSPR_ATTROUT
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
878 token
|= i
& D3DSP_REGNUM_MASK
; /* No shift */
882 for(i
= 0; i
< 8; i
++) {
883 if(regnum
== This
->oT_regnum
[i
]) {
884 token
|= (D3DSPR_TEXCRDOUT
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
885 token
|= i
& D3DSP_REGNUM_MASK
; /* No shift */
890 /* The varying must be undeclared - if an unsupported varying was declared,
891 * the vs_find_builtin_varyings function would have caught it and this code
893 WARN("Undeclared varying %u\n", regnum
);
894 This
->state
= E_INVALIDARG
;
898 static void vs_12_dstreg(struct bc_writer
*This
, const struct shader_reg
*reg
,
899 struct bytecode_buffer
*buffer
,
900 DWORD shift
, DWORD mod
) {
901 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
905 WARN("Relative addressing not supported for destination registers\n");
906 This
->state
= E_INVALIDARG
;
911 case BWRITERSPR_OUTPUT
:
912 token
|= map_vs_output(This
, reg
->regnum
, reg
->u
.writemask
, &has_wmask
);
915 case BWRITERSPR_RASTOUT
:
916 case BWRITERSPR_ATTROUT
:
917 /* These registers are mapped to input and output regs. They can be encoded in the bytecode,
918 * but are unexpected. If we hit this path it might be due to an error.
920 FIXME("Unexpected register type %u\n", reg
->type
);
922 case BWRITERSPR_INPUT
:
923 case BWRITERSPR_TEMP
:
924 case BWRITERSPR_CONST
:
925 token
|= (reg
->type
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
926 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
930 case BWRITERSPR_ADDR
:
931 if(reg
->regnum
!= 0) {
932 WARN("Only a0 exists\n");
933 This
->state
= E_INVALIDARG
;
936 token
|= (D3DSPR_ADDR
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
937 token
|= 0 & D3DSP_REGNUM_MASK
; /* No shift */
941 case BWRITERSPR_PREDICATE
:
942 if(This
->version
!= BWRITERVS_VERSION(2, 1)){
943 WARN("Predicate register is allowed only in vs_2_x\n");
944 This
->state
= E_INVALIDARG
;
947 if(reg
->regnum
!= 0) {
948 WARN("Only predicate register p0 exists\n");
949 This
->state
= E_INVALIDARG
;
952 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
953 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
954 token
|= 0 & D3DSP_REGNUM_MASK
; /* No shift */
959 WARN("Invalid register type for 1.x-2.x vertex shader\n");
960 This
->state
= E_INVALIDARG
;
964 /* strictly speaking there are no modifiers in vs_2_0 and vs_1_x, but they can be written
965 * into the bytecode and since the compiler doesn't do such checks write them
966 * (the checks are done by the undocumented shader validator)
968 token
|= (shift
<< D3DSP_DSTSHIFT_SHIFT
) & D3DSP_DSTSHIFT_MASK
;
969 token
|= d3d9_dstmod(mod
);
972 token
|= d3d9_writemask(reg
->u
.writemask
);
974 put_dword(buffer
, token
);
977 static void vs_1_x_srcreg(struct bc_writer
*This
, const struct shader_reg
*reg
,
978 struct bytecode_buffer
*buffer
) {
979 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
984 case BWRITERSPR_OUTPUT
:
985 /* Map the swizzle to a writemask, the format expected
988 switch(reg
->u
.swizzle
) {
989 case BWRITERVS_SWIZZLE_X
:
990 component
= BWRITERSP_WRITEMASK_0
;
992 case BWRITERVS_SWIZZLE_Y
:
993 component
= BWRITERSP_WRITEMASK_1
;
995 case BWRITERVS_SWIZZLE_Z
:
996 component
= BWRITERSP_WRITEMASK_2
;
998 case BWRITERVS_SWIZZLE_W
:
999 component
= BWRITERSP_WRITEMASK_3
;
1004 token
|= map_vs_output(This
, reg
->regnum
, component
, &has_swizzle
);
1007 case BWRITERSPR_RASTOUT
:
1008 case BWRITERSPR_ATTROUT
:
1009 /* These registers are mapped to input and output regs. They can be encoded in the bytecode,
1010 * but are unexpected. If we hit this path it might be due to an error.
1012 FIXME("Unexpected register type %u\n", reg
->type
);
1014 case BWRITERSPR_INPUT
:
1015 case BWRITERSPR_TEMP
:
1016 case BWRITERSPR_CONST
:
1017 case BWRITERSPR_ADDR
:
1018 token
|= (reg
->type
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1019 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1021 if(reg
->rel_reg
->type
!= BWRITERSPR_ADDR
||
1022 reg
->rel_reg
->regnum
!= 0 ||
1023 reg
->rel_reg
->u
.swizzle
!= BWRITERVS_SWIZZLE_X
) {
1024 WARN("Relative addressing in vs_1_x is only allowed with a0.x\n");
1025 This
->state
= E_INVALIDARG
;
1028 token
|= D3DVS_ADDRMODE_RELATIVE
& D3DVS_ADDRESSMODE_MASK
;
1033 WARN("Invalid register type for 1.x vshader\n");
1034 This
->state
= E_INVALIDARG
;
1038 token
|= d3d9_swizzle(reg
->u
.swizzle
) & D3DVS_SWIZZLE_MASK
; /* already shifted */
1040 token
|= d3d9_srcmod(reg
->srcmod
);
1041 put_dword(buffer
, token
);
1044 static void write_srcregs(struct bc_writer
*This
, const struct instruction
*instr
,
1045 struct bytecode_buffer
*buffer
){
1047 if(instr
->has_predicate
){
1048 This
->funcs
->srcreg(This
, &instr
->predicate
, buffer
);
1050 for(i
= 0; i
< instr
->num_srcs
; i
++){
1051 This
->funcs
->srcreg(This
, &instr
->src
[i
], buffer
);
1055 static DWORD
map_ps13_temp(struct bc_writer
*This
, const struct shader_reg
*reg
) {
1057 if(reg
->regnum
== T0_REG
) {
1058 token
|= (D3DSPR_TEXTURE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1059 token
|= 0 & D3DSP_REGNUM_MASK
; /* No shift */
1060 } else if(reg
->regnum
== T1_REG
) {
1061 token
|= (D3DSPR_TEXTURE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1062 token
|= 1 & D3DSP_REGNUM_MASK
; /* No shift */
1063 } else if(reg
->regnum
== T2_REG
) {
1064 token
|= (D3DSPR_TEXTURE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1065 token
|= 2 & D3DSP_REGNUM_MASK
; /* No shift */
1066 } else if(reg
->regnum
== T3_REG
) {
1067 token
|= (D3DSPR_TEXTURE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1068 token
|= 3 & D3DSP_REGNUM_MASK
; /* No shift */
1070 token
|= (D3DSPR_TEMP
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1071 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1076 static DWORD
map_ps_input(struct bc_writer
*This
,
1077 const struct shader_reg
*reg
) {
1079 /* Map color interpolators */
1080 for(i
= 0; i
< 2; i
++) {
1081 if(reg
->regnum
== This
->v_regnum
[i
]) {
1082 token
|= (D3DSPR_INPUT
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1083 token
|= i
& D3DSP_REGNUM_MASK
; /* No shift */
1087 for(i
= 0; i
< 8; i
++) {
1088 if(reg
->regnum
== This
->t_regnum
[i
]) {
1089 token
|= (D3DSPR_TEXTURE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1090 token
|= i
& D3DSP_REGNUM_MASK
; /* No shift */
1095 WARN("Invalid ps 1/2 varying\n");
1096 This
->state
= E_INVALIDARG
;
1100 static void ps_1_0123_srcreg(struct bc_writer
*This
, const struct shader_reg
*reg
,
1101 struct bytecode_buffer
*buffer
) {
1102 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1104 WARN("Relative addressing not supported in <= ps_3_0\n");
1105 This
->state
= E_INVALIDARG
;
1110 case BWRITERSPR_INPUT
:
1111 token
|= map_ps_input(This
, reg
);
1114 /* Take care about the texture temporaries. There's a problem: They aren't
1115 * declared anywhere, so we can only hardcode the values that are used
1116 * to map ps_1_3 shaders to the common shader structure
1118 case BWRITERSPR_TEMP
:
1119 token
|= map_ps13_temp(This
, reg
);
1122 case BWRITERSPR_CONST
: /* Can be mapped 1:1 */
1123 token
|= (reg
->type
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1124 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1128 WARN("Invalid register type for <= ps_1_3 shader\n");
1129 This
->state
= E_INVALIDARG
;
1133 token
|= d3d9_swizzle(reg
->u
.swizzle
) & D3DVS_SWIZZLE_MASK
; /* already shifted */
1135 if(reg
->srcmod
== BWRITERSPSM_DZ
|| reg
->srcmod
== BWRITERSPSM_DW
||
1136 reg
->srcmod
== BWRITERSPSM_ABS
|| reg
->srcmod
== BWRITERSPSM_ABSNEG
||
1137 reg
->srcmod
== BWRITERSPSM_NOT
) {
1138 WARN("Invalid source modifier %u for <= ps_1_3\n", reg
->srcmod
);
1139 This
->state
= E_INVALIDARG
;
1142 token
|= d3d9_srcmod(reg
->srcmod
);
1143 put_dword(buffer
, token
);
1146 static void ps_1_0123_dstreg(struct bc_writer
*This
, const struct shader_reg
*reg
,
1147 struct bytecode_buffer
*buffer
,
1148 DWORD shift
, DWORD mod
) {
1149 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1152 WARN("Relative addressing not supported for destination registers\n");
1153 This
->state
= E_INVALIDARG
;
1158 case BWRITERSPR_TEMP
:
1159 token
|= map_ps13_temp(This
, reg
);
1162 /* texkill uses the input register as a destination parameter */
1163 case BWRITERSPR_INPUT
:
1164 token
|= map_ps_input(This
, reg
);
1168 WARN("Invalid dest register type for 1.x pshader\n");
1169 This
->state
= E_INVALIDARG
;
1173 token
|= (shift
<< D3DSP_DSTSHIFT_SHIFT
) & D3DSP_DSTSHIFT_MASK
;
1174 token
|= d3d9_dstmod(mod
);
1176 token
|= d3d9_writemask(reg
->u
.writemask
);
1177 put_dword(buffer
, token
);
1180 /* The length of an instruction consists of the destination register (if any),
1181 * the number of source registers, the number of address registers used for
1182 * indirect addressing, and optionally the predicate register
1184 static DWORD
instrlen(const struct instruction
*instr
, unsigned int srcs
, unsigned int dsts
) {
1186 DWORD ret
= srcs
+ dsts
+ (instr
->has_predicate
? 1 : 0);
1189 if(instr
->dst
.rel_reg
) ret
++;
1191 for(i
= 0; i
< srcs
; i
++) {
1192 if(instr
->src
[i
].rel_reg
) ret
++;
1197 static void sm_1_x_opcode(struct bc_writer
*This
,
1198 const struct instruction
*instr
,
1199 DWORD token
, struct bytecode_buffer
*buffer
) {
1200 /* In sm_1_x instruction length isn't encoded */
1202 token
|= D3DSI_COISSUE
;
1204 put_dword(buffer
, token
);
1207 static void instr_handler(struct bc_writer
*This
,
1208 const struct instruction
*instr
,
1209 struct bytecode_buffer
*buffer
) {
1210 DWORD token
= d3d9_opcode(instr
->opcode
);
1212 This
->funcs
->opcode(This
, instr
, token
, buffer
);
1213 if(instr
->has_dst
) This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
);
1214 write_srcregs(This
, instr
, buffer
);
1217 static const struct instr_handler_table vs_1_x_handlers
[] = {
1218 {BWRITERSIO_ADD
, instr_handler
},
1219 {BWRITERSIO_NOP
, instr_handler
},
1220 {BWRITERSIO_MOV
, instr_handler
},
1221 {BWRITERSIO_SUB
, instr_handler
},
1222 {BWRITERSIO_MAD
, instr_handler
},
1223 {BWRITERSIO_MUL
, instr_handler
},
1224 {BWRITERSIO_RCP
, instr_handler
},
1225 {BWRITERSIO_RSQ
, instr_handler
},
1226 {BWRITERSIO_DP3
, instr_handler
},
1227 {BWRITERSIO_DP4
, instr_handler
},
1228 {BWRITERSIO_MIN
, instr_handler
},
1229 {BWRITERSIO_MAX
, instr_handler
},
1230 {BWRITERSIO_SLT
, instr_handler
},
1231 {BWRITERSIO_SGE
, instr_handler
},
1232 {BWRITERSIO_EXP
, instr_handler
},
1233 {BWRITERSIO_LOG
, instr_handler
},
1234 {BWRITERSIO_EXPP
, instr_handler
},
1235 {BWRITERSIO_LOGP
, instr_handler
},
1236 {BWRITERSIO_DST
, instr_handler
},
1237 {BWRITERSIO_FRC
, instr_handler
},
1238 {BWRITERSIO_M4x4
, instr_handler
},
1239 {BWRITERSIO_M4x3
, instr_handler
},
1240 {BWRITERSIO_M3x4
, instr_handler
},
1241 {BWRITERSIO_M3x3
, instr_handler
},
1242 {BWRITERSIO_M3x2
, instr_handler
},
1243 {BWRITERSIO_LIT
, instr_handler
},
1245 {BWRITERSIO_END
, NULL
}, /* Sentinel value, it signals
1246 the end of the list */
1249 static const struct bytecode_backend vs_1_x_backend
= {
1258 static void instr_ps_1_0123_texld(struct bc_writer
*This
,
1259 const struct instruction
*instr
,
1260 struct bytecode_buffer
*buffer
) {
1262 struct shader_reg reg
;
1265 if(instr
->src
[1].type
!= BWRITERSPR_SAMPLER
||
1266 instr
->src
[1].regnum
> 3) {
1267 WARN("Unsupported sampler type %u regnum %u\n",
1268 instr
->src
[1].type
, instr
->src
[1].regnum
);
1269 This
->state
= E_INVALIDARG
;
1271 } else if(instr
->dst
.type
!= BWRITERSPR_TEMP
) {
1272 WARN("Can only sample into a temp register\n");
1273 This
->state
= E_INVALIDARG
;
1277 idx
= instr
->src
[1].regnum
;
1278 if((idx
== 0 && instr
->dst
.regnum
!= T0_REG
) ||
1279 (idx
== 1 && instr
->dst
.regnum
!= T1_REG
) ||
1280 (idx
== 2 && instr
->dst
.regnum
!= T2_REG
) ||
1281 (idx
== 3 && instr
->dst
.regnum
!= T3_REG
)) {
1282 WARN("Sampling from sampler s%u to register r%u is not possible in ps_1_x\n",
1283 idx
, instr
->dst
.regnum
);
1284 This
->state
= E_INVALIDARG
;
1287 if(instr
->src
[0].type
== BWRITERSPR_INPUT
) {
1288 /* A simple non-dependent read tex instruction */
1289 if(instr
->src
[0].regnum
!= This
->t_regnum
[idx
]) {
1290 WARN("Cannot sample from s%u with texture address data from interpolator %u\n",
1291 idx
, instr
->src
[0].regnum
);
1292 This
->state
= E_INVALIDARG
;
1295 This
->funcs
->opcode(This
, instr
, D3DSIO_TEX
& D3DSI_OPCODE_MASK
, buffer
);
1297 /* map the temp dstreg to the ps_1_3 texture temporary register */
1298 This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
);
1299 } else if(instr
->src
[0].type
== BWRITERSPR_TEMP
) {
1301 swizzlemask
= (3 << BWRITERVS_SWIZZLE_SHIFT
) |
1302 (3 << (BWRITERVS_SWIZZLE_SHIFT
+ 2)) |
1303 (3 << (BWRITERVS_SWIZZLE_SHIFT
+ 4));
1304 if((instr
->src
[0].u
.swizzle
& swizzlemask
) == (BWRITERVS_X_X
| BWRITERVS_Y_Y
| BWRITERVS_Z_Z
)) {
1305 TRACE("writing texreg2rgb\n");
1306 This
->funcs
->opcode(This
, instr
, D3DSIO_TEXREG2RGB
& D3DSI_OPCODE_MASK
, buffer
);
1307 } else if(instr
->src
[0].u
.swizzle
== (BWRITERVS_X_W
| BWRITERVS_Y_X
| BWRITERVS_Z_X
| BWRITERVS_W_X
)) {
1308 TRACE("writing texreg2ar\n");
1309 This
->funcs
->opcode(This
, instr
, D3DSIO_TEXREG2AR
& D3DSI_OPCODE_MASK
, buffer
);
1310 } else if(instr
->src
[0].u
.swizzle
== (BWRITERVS_X_Y
| BWRITERVS_Y_Z
| BWRITERVS_Z_Z
| BWRITERVS_W_Z
)) {
1311 TRACE("writing texreg2gb\n");
1312 This
->funcs
->opcode(This
, instr
, D3DSIO_TEXREG2GB
& D3DSI_OPCODE_MASK
, buffer
);
1314 WARN("Unsupported src addr swizzle in dependent texld: 0x%08x\n", instr
->src
[0].u
.swizzle
);
1315 This
->state
= E_INVALIDARG
;
1319 /* Dst and src reg can be mapped normally. Both registers are temporary registers in the
1320 * source shader and have to be mapped to the temporary form of the texture registers. However,
1321 * the src reg doesn't have a swizzle
1323 This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
);
1324 reg
= instr
->src
[0];
1325 reg
.u
.swizzle
= BWRITERVS_NOSWIZZLE
;
1326 This
->funcs
->srcreg(This
, ®
, buffer
);
1328 WARN("Invalid address data source register\n");
1329 This
->state
= E_INVALIDARG
;
1334 static void instr_ps_1_0123_mov(struct bc_writer
*This
,
1335 const struct instruction
*instr
,
1336 struct bytecode_buffer
*buffer
) {
1337 DWORD token
= D3DSIO_MOV
& D3DSI_OPCODE_MASK
;
1339 if(instr
->dst
.type
== BWRITERSPR_TEMP
&& instr
->src
[0].type
== BWRITERSPR_INPUT
) {
1340 if((instr
->dst
.regnum
== T0_REG
&& instr
->src
[0].regnum
== This
->t_regnum
[0]) ||
1341 (instr
->dst
.regnum
== T1_REG
&& instr
->src
[0].regnum
== This
->t_regnum
[1]) ||
1342 (instr
->dst
.regnum
== T2_REG
&& instr
->src
[0].regnum
== This
->t_regnum
[2]) ||
1343 (instr
->dst
.regnum
== T3_REG
&& instr
->src
[0].regnum
== This
->t_regnum
[3])) {
1344 if(instr
->dstmod
& BWRITERSPDM_SATURATE
) {
1345 This
->funcs
->opcode(This
, instr
, D3DSIO_TEXCOORD
& D3DSI_OPCODE_MASK
, buffer
);
1346 /* Remove the SATURATE flag, it's implicit to the instruction */
1347 This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
& (~BWRITERSPDM_SATURATE
));
1350 WARN("A varying -> temp copy is only supported with the SATURATE modifier in <=ps_1_3\n");
1351 This
->state
= E_INVALIDARG
;
1354 } else if(instr
->src
[0].regnum
== This
->v_regnum
[0] ||
1355 instr
->src
[0].regnum
== This
->v_regnum
[1]) {
1356 /* Handled by the normal mov below. Just drop out of the if condition */
1358 WARN("Unsupported varying -> temp mov in <= ps_1_3\n");
1359 This
->state
= E_INVALIDARG
;
1364 This
->funcs
->opcode(This
, instr
, token
, buffer
);
1365 This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
);
1366 This
->funcs
->srcreg(This
, &instr
->src
[0], buffer
);
1369 static const struct instr_handler_table ps_1_0123_handlers
[] = {
1370 {BWRITERSIO_ADD
, instr_handler
},
1371 {BWRITERSIO_NOP
, instr_handler
},
1372 {BWRITERSIO_MOV
, instr_ps_1_0123_mov
},
1373 {BWRITERSIO_SUB
, instr_handler
},
1374 {BWRITERSIO_MAD
, instr_handler
},
1375 {BWRITERSIO_MUL
, instr_handler
},
1376 {BWRITERSIO_DP3
, instr_handler
},
1377 {BWRITERSIO_DP4
, instr_handler
},
1378 {BWRITERSIO_LRP
, instr_handler
},
1380 /* pshader instructions */
1381 {BWRITERSIO_CND
, instr_handler
},
1382 {BWRITERSIO_CMP
, instr_handler
},
1383 {BWRITERSIO_TEXKILL
, instr_handler
},
1384 {BWRITERSIO_TEX
, instr_ps_1_0123_texld
},
1385 {BWRITERSIO_TEXBEM
, instr_handler
},
1386 {BWRITERSIO_TEXBEML
, instr_handler
},
1387 {BWRITERSIO_TEXM3x2PAD
, instr_handler
},
1388 {BWRITERSIO_TEXM3x3PAD
, instr_handler
},
1389 {BWRITERSIO_TEXM3x3SPEC
, instr_handler
},
1390 {BWRITERSIO_TEXM3x3VSPEC
, instr_handler
},
1391 {BWRITERSIO_TEXM3x3TEX
, instr_handler
},
1392 {BWRITERSIO_TEXM3x3
, instr_handler
},
1393 {BWRITERSIO_TEXM3x2DEPTH
, instr_handler
},
1394 {BWRITERSIO_TEXM3x2TEX
, instr_handler
},
1395 {BWRITERSIO_TEXDP3
, instr_handler
},
1396 {BWRITERSIO_TEXDP3TEX
, instr_handler
},
1397 {BWRITERSIO_END
, NULL
},
1400 static const struct bytecode_backend ps_1_0123_backend
= {
1409 static void ps_1_4_srcreg(struct bc_writer
*This
, const struct shader_reg
*reg
,
1410 struct bytecode_buffer
*buffer
) {
1411 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1413 WARN("Relative addressing not supported in <= ps_3_0\n");
1414 This
->state
= E_INVALIDARG
;
1419 case BWRITERSPR_INPUT
:
1420 token
|= map_ps_input(This
, reg
);
1423 /* Can be mapped 1:1 */
1424 case BWRITERSPR_TEMP
:
1425 case BWRITERSPR_CONST
:
1426 token
|= (reg
->type
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1427 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1431 WARN("Invalid register type for ps_1_4 shader\n");
1432 This
->state
= E_INVALIDARG
;
1436 token
|= d3d9_swizzle(reg
->u
.swizzle
) & D3DVS_SWIZZLE_MASK
; /* already shifted */
1438 if(reg
->srcmod
== BWRITERSPSM_ABS
|| reg
->srcmod
== BWRITERSPSM_ABSNEG
||
1439 reg
->srcmod
== BWRITERSPSM_NOT
) {
1440 WARN("Invalid source modifier %u for ps_1_4\n", reg
->srcmod
);
1441 This
->state
= E_INVALIDARG
;
1444 token
|= d3d9_srcmod(reg
->srcmod
);
1445 put_dword(buffer
, token
);
1448 static void ps_1_4_dstreg(struct bc_writer
*This
, const struct shader_reg
*reg
,
1449 struct bytecode_buffer
*buffer
,
1450 DWORD shift
, DWORD mod
) {
1451 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1454 WARN("Relative addressing not supported for destination registers\n");
1455 This
->state
= E_INVALIDARG
;
1460 case BWRITERSPR_TEMP
: /* 1:1 mapping */
1461 token
|= (reg
->type
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1462 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1466 case BWRITERSPR_INPUT
:
1467 token
|= map_ps_input(This
, reg
);
1471 WARN("Invalid dest register type for 1.x pshader\n");
1472 This
->state
= E_INVALIDARG
;
1476 token
|= (shift
<< D3DSP_DSTSHIFT_SHIFT
) & D3DSP_DSTSHIFT_MASK
;
1477 token
|= d3d9_dstmod(mod
);
1479 token
|= d3d9_writemask(reg
->u
.writemask
);
1480 put_dword(buffer
, token
);
1483 static void instr_ps_1_4_mov(struct bc_writer
*This
,
1484 const struct instruction
*instr
,
1485 struct bytecode_buffer
*buffer
) {
1486 DWORD token
= D3DSIO_MOV
& D3DSI_OPCODE_MASK
;
1488 if(instr
->dst
.type
== BWRITERSPR_TEMP
&& instr
->src
[0].type
== BWRITERSPR_INPUT
) {
1489 if(instr
->src
[0].regnum
== This
->t_regnum
[0] ||
1490 instr
->src
[0].regnum
== This
->t_regnum
[1] ||
1491 instr
->src
[0].regnum
== This
->t_regnum
[2] ||
1492 instr
->src
[0].regnum
== This
->t_regnum
[3] ||
1493 instr
->src
[0].regnum
== This
->t_regnum
[4] ||
1494 instr
->src
[0].regnum
== This
->t_regnum
[5]) {
1495 /* Similar to a regular mov, but a different opcode */
1496 token
= D3DSIO_TEXCOORD
& D3DSI_OPCODE_MASK
;
1497 } else if(instr
->src
[0].regnum
== This
->v_regnum
[0] ||
1498 instr
->src
[0].regnum
== This
->v_regnum
[1]) {
1499 /* Handled by the normal mov below. Just drop out of the if condition */
1501 WARN("Unsupported varying -> temp mov in ps_1_4\n");
1502 This
->state
= E_INVALIDARG
;
1507 This
->funcs
->opcode(This
, instr
, token
, buffer
);
1508 This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
);
1509 This
->funcs
->srcreg(This
, &instr
->src
[0], buffer
);
1512 static void instr_ps_1_4_texld(struct bc_writer
*This
,
1513 const struct instruction
*instr
,
1514 struct bytecode_buffer
*buffer
) {
1515 if(instr
->src
[1].type
!= BWRITERSPR_SAMPLER
||
1516 instr
->src
[1].regnum
> 5) {
1517 WARN("Unsupported sampler type %u regnum %u\n",
1518 instr
->src
[1].type
, instr
->src
[1].regnum
);
1519 This
->state
= E_INVALIDARG
;
1521 } else if(instr
->dst
.type
!= BWRITERSPR_TEMP
) {
1522 WARN("Can only sample into a temp register\n");
1523 This
->state
= E_INVALIDARG
;
1527 if(instr
->src
[1].regnum
!= instr
->dst
.regnum
) {
1528 WARN("Sampling from sampler s%u to register r%u is not possible in ps_1_4\n",
1529 instr
->src
[1].regnum
, instr
->dst
.regnum
);
1530 This
->state
= E_INVALIDARG
;
1534 This
->funcs
->opcode(This
, instr
, D3DSIO_TEX
& D3DSI_OPCODE_MASK
, buffer
);
1535 This
->funcs
->dstreg(This
, &instr
->dst
, buffer
, instr
->shift
, instr
->dstmod
);
1536 This
->funcs
->srcreg(This
, &instr
->src
[0], buffer
);
1539 static const struct instr_handler_table ps_1_4_handlers
[] = {
1540 {BWRITERSIO_ADD
, instr_handler
},
1541 {BWRITERSIO_NOP
, instr_handler
},
1542 {BWRITERSIO_MOV
, instr_ps_1_4_mov
},
1543 {BWRITERSIO_SUB
, instr_handler
},
1544 {BWRITERSIO_MAD
, instr_handler
},
1545 {BWRITERSIO_MUL
, instr_handler
},
1546 {BWRITERSIO_DP3
, instr_handler
},
1547 {BWRITERSIO_DP4
, instr_handler
},
1548 {BWRITERSIO_LRP
, instr_handler
},
1550 /* pshader instructions */
1551 {BWRITERSIO_CND
, instr_handler
},
1552 {BWRITERSIO_CMP
, instr_handler
},
1553 {BWRITERSIO_TEXKILL
, instr_handler
},
1554 {BWRITERSIO_TEX
, instr_ps_1_4_texld
},
1555 {BWRITERSIO_TEXDEPTH
, instr_handler
},
1556 {BWRITERSIO_BEM
, instr_handler
},
1558 {BWRITERSIO_PHASE
, instr_handler
},
1559 {BWRITERSIO_END
, NULL
},
1562 static const struct bytecode_backend ps_1_4_backend
= {
1571 static void write_constB(const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
, BOOL len
) {
1572 write_const(shader
->constB
, shader
->num_cb
, D3DSIO_DEFB
, D3DSPR_CONSTBOOL
, buffer
, len
);
1575 static void write_constI(const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
, BOOL len
) {
1576 write_const(shader
->constI
, shader
->num_ci
, D3DSIO_DEFI
, D3DSPR_CONSTINT
, buffer
, len
);
1579 static void vs_2_header(struct bc_writer
*This
,
1580 const struct bwriter_shader
*shader
,
1581 struct bytecode_buffer
*buffer
) {
1584 hr
= vs_find_builtin_varyings(This
, shader
);
1590 write_declarations(This
, buffer
, TRUE
, shader
->inputs
, shader
->num_inputs
, BWRITERSPR_INPUT
);
1591 write_constF(shader
, buffer
, TRUE
);
1592 write_constB(shader
, buffer
, TRUE
);
1593 write_constI(shader
, buffer
, TRUE
);
1596 static void vs_2_srcreg(struct bc_writer
*This
,
1597 const struct shader_reg
*reg
,
1598 struct bytecode_buffer
*buffer
) {
1599 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1605 case BWRITERSPR_OUTPUT
:
1606 /* Map the swizzle to a writemask, the format expected
1609 switch(reg
->u
.swizzle
) {
1610 case BWRITERVS_SWIZZLE_X
:
1611 component
= BWRITERSP_WRITEMASK_0
;
1613 case BWRITERVS_SWIZZLE_Y
:
1614 component
= BWRITERSP_WRITEMASK_1
;
1616 case BWRITERVS_SWIZZLE_Z
:
1617 component
= BWRITERSP_WRITEMASK_2
;
1619 case BWRITERVS_SWIZZLE_W
:
1620 component
= BWRITERSP_WRITEMASK_3
;
1625 token
|= map_vs_output(This
, reg
->regnum
, component
, &has_swizzle
);
1628 case BWRITERSPR_RASTOUT
:
1629 case BWRITERSPR_ATTROUT
:
1630 /* These registers are mapped to input and output regs. They can be encoded in the bytecode,
1631 * but are unexpected. If we hit this path it might be due to an error.
1633 FIXME("Unexpected register type %u\n", reg
->type
);
1635 case BWRITERSPR_INPUT
:
1636 case BWRITERSPR_TEMP
:
1637 case BWRITERSPR_CONST
:
1638 case BWRITERSPR_ADDR
:
1639 case BWRITERSPR_CONSTINT
:
1640 case BWRITERSPR_CONSTBOOL
:
1641 case BWRITERSPR_LABEL
:
1642 d3d9reg
= d3d9_register(reg
->type
);
1643 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1644 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1645 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1648 case BWRITERSPR_LOOP
:
1649 if(reg
->regnum
!= 0) {
1650 WARN("Only regnum 0 is supported for the loop index register in vs_2_0\n");
1651 This
->state
= E_INVALIDARG
;
1654 token
|= (D3DSPR_LOOP
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1655 token
|= (D3DSPR_LOOP
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1656 token
|= 0 & D3DSP_REGNUM_MASK
; /* No shift */
1659 case BWRITERSPR_PREDICATE
:
1660 if(This
->version
!= BWRITERVS_VERSION(2, 1)){
1661 WARN("Predicate register is allowed only in vs_2_x\n");
1662 This
->state
= E_INVALIDARG
;
1665 if(reg
->regnum
> 0) {
1666 WARN("Only predicate register 0 is supported\n");
1667 This
->state
= E_INVALIDARG
;
1670 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1671 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1672 token
|= 0 & D3DSP_REGNUM_MASK
; /* No shift */
1677 WARN("Invalid register type for 2.0 vshader\n");
1678 This
->state
= E_INVALIDARG
;
1682 token
|= d3d9_swizzle(reg
->u
.swizzle
) & D3DVS_SWIZZLE_MASK
; /* already shifted */
1684 token
|= d3d9_srcmod(reg
->srcmod
);
1687 token
|= D3DVS_ADDRMODE_RELATIVE
& D3DVS_ADDRESSMODE_MASK
;
1689 put_dword(buffer
, token
);
1691 /* vs_2_0 and newer write the register containing the index explicitly in the
1694 if(token
& D3DVS_ADDRMODE_RELATIVE
)
1695 vs_2_srcreg(This
, reg
->rel_reg
, buffer
);
1698 static void sm_2_opcode(struct bc_writer
*This
,
1699 const struct instruction
*instr
,
1700 DWORD token
, struct bytecode_buffer
*buffer
) {
1701 /* From sm 2 onwards instruction length is encoded in the opcode field */
1702 int dsts
= instr
->has_dst
? 1 : 0;
1703 token
|= instrlen(instr
, instr
->num_srcs
, dsts
) << D3DSI_INSTLENGTH_SHIFT
;
1705 token
|= (d3d9_comparetype(instr
->comptype
) << 16) & (0xf << 16);
1706 if(instr
->has_predicate
)
1707 token
|= D3DSHADER_INSTRUCTION_PREDICATED
;
1708 put_dword(buffer
,token
);
1711 static const struct instr_handler_table vs_2_0_handlers
[] = {
1712 {BWRITERSIO_ADD
, instr_handler
},
1713 {BWRITERSIO_NOP
, instr_handler
},
1714 {BWRITERSIO_MOV
, instr_handler
},
1715 {BWRITERSIO_SUB
, instr_handler
},
1716 {BWRITERSIO_MAD
, instr_handler
},
1717 {BWRITERSIO_MUL
, instr_handler
},
1718 {BWRITERSIO_RCP
, instr_handler
},
1719 {BWRITERSIO_RSQ
, instr_handler
},
1720 {BWRITERSIO_DP3
, instr_handler
},
1721 {BWRITERSIO_DP4
, instr_handler
},
1722 {BWRITERSIO_MIN
, instr_handler
},
1723 {BWRITERSIO_MAX
, instr_handler
},
1724 {BWRITERSIO_SLT
, instr_handler
},
1725 {BWRITERSIO_SGE
, instr_handler
},
1726 {BWRITERSIO_ABS
, instr_handler
},
1727 {BWRITERSIO_EXP
, instr_handler
},
1728 {BWRITERSIO_LOG
, instr_handler
},
1729 {BWRITERSIO_EXPP
, instr_handler
},
1730 {BWRITERSIO_LOGP
, instr_handler
},
1731 {BWRITERSIO_DST
, instr_handler
},
1732 {BWRITERSIO_LRP
, instr_handler
},
1733 {BWRITERSIO_FRC
, instr_handler
},
1734 {BWRITERSIO_CRS
, instr_handler
},
1735 {BWRITERSIO_SGN
, instr_handler
},
1736 {BWRITERSIO_NRM
, instr_handler
},
1737 {BWRITERSIO_SINCOS
, instr_handler
},
1738 {BWRITERSIO_M4x4
, instr_handler
},
1739 {BWRITERSIO_M4x3
, instr_handler
},
1740 {BWRITERSIO_M3x4
, instr_handler
},
1741 {BWRITERSIO_M3x3
, instr_handler
},
1742 {BWRITERSIO_M3x2
, instr_handler
},
1743 {BWRITERSIO_LIT
, instr_handler
},
1744 {BWRITERSIO_POW
, instr_handler
},
1745 {BWRITERSIO_MOVA
, instr_handler
},
1747 {BWRITERSIO_CALL
, instr_handler
},
1748 {BWRITERSIO_CALLNZ
, instr_handler
},
1749 {BWRITERSIO_REP
, instr_handler
},
1750 {BWRITERSIO_ENDREP
, instr_handler
},
1751 {BWRITERSIO_IF
, instr_handler
},
1752 {BWRITERSIO_LABEL
, instr_handler
},
1753 {BWRITERSIO_ELSE
, instr_handler
},
1754 {BWRITERSIO_ENDIF
, instr_handler
},
1755 {BWRITERSIO_LOOP
, instr_handler
},
1756 {BWRITERSIO_RET
, instr_handler
},
1757 {BWRITERSIO_ENDLOOP
, instr_handler
},
1759 {BWRITERSIO_END
, NULL
},
1762 static const struct bytecode_backend vs_2_0_backend
= {
1771 static const struct instr_handler_table vs_2_x_handlers
[] = {
1772 {BWRITERSIO_ADD
, instr_handler
},
1773 {BWRITERSIO_NOP
, instr_handler
},
1774 {BWRITERSIO_MOV
, instr_handler
},
1775 {BWRITERSIO_SUB
, instr_handler
},
1776 {BWRITERSIO_MAD
, instr_handler
},
1777 {BWRITERSIO_MUL
, instr_handler
},
1778 {BWRITERSIO_RCP
, instr_handler
},
1779 {BWRITERSIO_RSQ
, instr_handler
},
1780 {BWRITERSIO_DP3
, instr_handler
},
1781 {BWRITERSIO_DP4
, instr_handler
},
1782 {BWRITERSIO_MIN
, instr_handler
},
1783 {BWRITERSIO_MAX
, instr_handler
},
1784 {BWRITERSIO_SLT
, instr_handler
},
1785 {BWRITERSIO_SGE
, instr_handler
},
1786 {BWRITERSIO_ABS
, instr_handler
},
1787 {BWRITERSIO_EXP
, instr_handler
},
1788 {BWRITERSIO_LOG
, instr_handler
},
1789 {BWRITERSIO_EXPP
, instr_handler
},
1790 {BWRITERSIO_LOGP
, instr_handler
},
1791 {BWRITERSIO_DST
, instr_handler
},
1792 {BWRITERSIO_LRP
, instr_handler
},
1793 {BWRITERSIO_FRC
, instr_handler
},
1794 {BWRITERSIO_CRS
, instr_handler
},
1795 {BWRITERSIO_SGN
, instr_handler
},
1796 {BWRITERSIO_NRM
, instr_handler
},
1797 {BWRITERSIO_SINCOS
, instr_handler
},
1798 {BWRITERSIO_M4x4
, instr_handler
},
1799 {BWRITERSIO_M4x3
, instr_handler
},
1800 {BWRITERSIO_M3x4
, instr_handler
},
1801 {BWRITERSIO_M3x3
, instr_handler
},
1802 {BWRITERSIO_M3x2
, instr_handler
},
1803 {BWRITERSIO_LIT
, instr_handler
},
1804 {BWRITERSIO_POW
, instr_handler
},
1805 {BWRITERSIO_MOVA
, instr_handler
},
1807 {BWRITERSIO_CALL
, instr_handler
},
1808 {BWRITERSIO_CALLNZ
, instr_handler
},
1809 {BWRITERSIO_REP
, instr_handler
},
1810 {BWRITERSIO_ENDREP
, instr_handler
},
1811 {BWRITERSIO_IF
, instr_handler
},
1812 {BWRITERSIO_LABEL
, instr_handler
},
1813 {BWRITERSIO_IFC
, instr_handler
},
1814 {BWRITERSIO_ELSE
, instr_handler
},
1815 {BWRITERSIO_ENDIF
, instr_handler
},
1816 {BWRITERSIO_BREAK
, instr_handler
},
1817 {BWRITERSIO_BREAKC
, instr_handler
},
1818 {BWRITERSIO_LOOP
, instr_handler
},
1819 {BWRITERSIO_RET
, instr_handler
},
1820 {BWRITERSIO_ENDLOOP
, instr_handler
},
1822 {BWRITERSIO_SETP
, instr_handler
},
1823 {BWRITERSIO_BREAKP
, instr_handler
},
1825 {BWRITERSIO_END
, NULL
},
1828 static const struct bytecode_backend vs_2_x_backend
= {
1837 static void write_samplers(const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
1839 DWORD instr_dcl
= D3DSIO_DCL
| (2 << D3DSI_INSTLENGTH_SHIFT
);
1841 const DWORD reg
= (1<<31) |
1842 ((D3DSPR_SAMPLER
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
) |
1843 ((D3DSPR_SAMPLER
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
) |
1844 D3DSP_WRITEMASK_ALL
;
1846 for(i
= 0; i
< shader
->num_samplers
; i
++) {
1847 /* Write the DCL instruction */
1848 put_dword(buffer
, instr_dcl
);
1850 /* Already shifted */
1851 token
|= (d3d9_sampler(shader
->samplers
[i
].type
)) & D3DSP_TEXTURETYPE_MASK
;
1852 put_dword(buffer
, token
);
1853 token
= reg
| (shader
->samplers
[i
].regnum
& D3DSP_REGNUM_MASK
);
1854 token
|= d3d9_dstmod(shader
->samplers
[i
].mod
);
1855 put_dword(buffer
, token
);
1859 static void ps_2_header(struct bc_writer
*This
, const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
1860 HRESULT hr
= find_ps_builtin_semantics(This
, shader
, 8);
1866 write_declarations(This
, buffer
, TRUE
, shader
->inputs
, shader
->num_inputs
, BWRITERSPR_INPUT
);
1867 write_samplers(shader
, buffer
);
1868 write_constF(shader
, buffer
, TRUE
);
1869 write_constB(shader
, buffer
, TRUE
);
1870 write_constI(shader
, buffer
, TRUE
);
1873 static void ps_2_srcreg(struct bc_writer
*This
,
1874 const struct shader_reg
*reg
,
1875 struct bytecode_buffer
*buffer
) {
1876 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1879 WARN("Relative addressing not supported in <= ps_3_0\n");
1880 This
->state
= E_INVALIDARG
;
1885 case BWRITERSPR_INPUT
:
1886 token
|= map_ps_input(This
, reg
);
1889 /* Can be mapped 1:1 */
1890 case BWRITERSPR_TEMP
:
1891 case BWRITERSPR_CONST
:
1892 case BWRITERSPR_COLOROUT
:
1893 case BWRITERSPR_CONSTBOOL
:
1894 case BWRITERSPR_CONSTINT
:
1895 case BWRITERSPR_SAMPLER
:
1896 case BWRITERSPR_LABEL
:
1897 case BWRITERSPR_DEPTHOUT
:
1898 d3d9reg
= d3d9_register(reg
->type
);
1899 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1900 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1901 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1904 case BWRITERSPR_PREDICATE
:
1905 if(This
->version
!= BWRITERPS_VERSION(2, 1)){
1906 WARN("Predicate register not supported in ps_2_0\n");
1907 This
->state
= E_INVALIDARG
;
1910 WARN("Predicate register with regnum %u not supported\n",
1912 This
->state
= E_INVALIDARG
;
1914 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1915 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1916 token
|= 0 & D3DSP_REGNUM_MASK
; /* No shift */
1920 WARN("Invalid register type for ps_2_0 shader\n");
1921 This
->state
= E_INVALIDARG
;
1925 token
|= d3d9_swizzle(reg
->u
.swizzle
) & D3DVS_SWIZZLE_MASK
; /* already shifted */
1927 token
|= d3d9_srcmod(reg
->srcmod
);
1928 put_dword(buffer
, token
);
1931 static void ps_2_0_dstreg(struct bc_writer
*This
,
1932 const struct shader_reg
*reg
,
1933 struct bytecode_buffer
*buffer
,
1934 DWORD shift
, DWORD mod
) {
1935 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
1939 WARN("Relative addressing not supported for destination registers\n");
1940 This
->state
= E_INVALIDARG
;
1945 case BWRITERSPR_TEMP
: /* 1:1 mapping */
1946 case BWRITERSPR_COLOROUT
:
1947 case BWRITERSPR_DEPTHOUT
:
1948 d3d9reg
= d3d9_register(reg
->type
);
1949 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1950 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1951 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1954 case BWRITERSPR_PREDICATE
:
1955 if(This
->version
!= BWRITERPS_VERSION(2, 1)){
1956 WARN("Predicate register not supported in ps_2_0\n");
1957 This
->state
= E_INVALIDARG
;
1959 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
1960 token
|= (D3DSPR_PREDICATE
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
1961 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
1964 /* texkill uses the input register as a destination parameter */
1965 case BWRITERSPR_INPUT
:
1966 token
|= map_ps_input(This
, reg
);
1970 WARN("Invalid dest register type for 2.x pshader\n");
1971 This
->state
= E_INVALIDARG
;
1975 token
|= (shift
<< D3DSP_DSTSHIFT_SHIFT
) & D3DSP_DSTSHIFT_MASK
;
1976 token
|= d3d9_dstmod(mod
);
1978 token
|= d3d9_writemask(reg
->u
.writemask
);
1979 put_dword(buffer
, token
);
1982 static const struct instr_handler_table ps_2_0_handlers
[] = {
1983 {BWRITERSIO_ADD
, instr_handler
},
1984 {BWRITERSIO_NOP
, instr_handler
},
1985 {BWRITERSIO_MOV
, instr_handler
},
1986 {BWRITERSIO_SUB
, instr_handler
},
1987 {BWRITERSIO_MAD
, instr_handler
},
1988 {BWRITERSIO_MUL
, instr_handler
},
1989 {BWRITERSIO_RCP
, instr_handler
},
1990 {BWRITERSIO_RSQ
, instr_handler
},
1991 {BWRITERSIO_DP3
, instr_handler
},
1992 {BWRITERSIO_DP4
, instr_handler
},
1993 {BWRITERSIO_MIN
, instr_handler
},
1994 {BWRITERSIO_MAX
, instr_handler
},
1995 {BWRITERSIO_ABS
, instr_handler
},
1996 {BWRITERSIO_EXP
, instr_handler
},
1997 {BWRITERSIO_LOG
, instr_handler
},
1998 {BWRITERSIO_EXPP
, instr_handler
},
1999 {BWRITERSIO_LOGP
, instr_handler
},
2000 {BWRITERSIO_LRP
, instr_handler
},
2001 {BWRITERSIO_FRC
, instr_handler
},
2002 {BWRITERSIO_CRS
, instr_handler
},
2003 {BWRITERSIO_NRM
, instr_handler
},
2004 {BWRITERSIO_SINCOS
, instr_handler
},
2005 {BWRITERSIO_M4x4
, instr_handler
},
2006 {BWRITERSIO_M4x3
, instr_handler
},
2007 {BWRITERSIO_M3x4
, instr_handler
},
2008 {BWRITERSIO_M3x3
, instr_handler
},
2009 {BWRITERSIO_M3x2
, instr_handler
},
2010 {BWRITERSIO_POW
, instr_handler
},
2011 {BWRITERSIO_DP2ADD
, instr_handler
},
2012 {BWRITERSIO_CMP
, instr_handler
},
2014 {BWRITERSIO_TEX
, instr_handler
},
2015 {BWRITERSIO_TEXLDP
, instr_handler
},
2016 {BWRITERSIO_TEXLDB
, instr_handler
},
2017 {BWRITERSIO_TEXKILL
, instr_handler
},
2019 {BWRITERSIO_END
, NULL
},
2022 static const struct bytecode_backend ps_2_0_backend
= {
2031 static const struct instr_handler_table ps_2_x_handlers
[] = {
2032 {BWRITERSIO_ADD
, instr_handler
},
2033 {BWRITERSIO_NOP
, instr_handler
},
2034 {BWRITERSIO_MOV
, instr_handler
},
2035 {BWRITERSIO_SUB
, instr_handler
},
2036 {BWRITERSIO_MAD
, instr_handler
},
2037 {BWRITERSIO_MUL
, instr_handler
},
2038 {BWRITERSIO_RCP
, instr_handler
},
2039 {BWRITERSIO_RSQ
, instr_handler
},
2040 {BWRITERSIO_DP3
, instr_handler
},
2041 {BWRITERSIO_DP4
, instr_handler
},
2042 {BWRITERSIO_MIN
, instr_handler
},
2043 {BWRITERSIO_MAX
, instr_handler
},
2044 {BWRITERSIO_ABS
, instr_handler
},
2045 {BWRITERSIO_EXP
, instr_handler
},
2046 {BWRITERSIO_LOG
, instr_handler
},
2047 {BWRITERSIO_EXPP
, instr_handler
},
2048 {BWRITERSIO_LOGP
, instr_handler
},
2049 {BWRITERSIO_LRP
, instr_handler
},
2050 {BWRITERSIO_FRC
, instr_handler
},
2051 {BWRITERSIO_CRS
, instr_handler
},
2052 {BWRITERSIO_NRM
, instr_handler
},
2053 {BWRITERSIO_SINCOS
, instr_handler
},
2054 {BWRITERSIO_M4x4
, instr_handler
},
2055 {BWRITERSIO_M4x3
, instr_handler
},
2056 {BWRITERSIO_M3x4
, instr_handler
},
2057 {BWRITERSIO_M3x3
, instr_handler
},
2058 {BWRITERSIO_M3x2
, instr_handler
},
2059 {BWRITERSIO_POW
, instr_handler
},
2060 {BWRITERSIO_DP2ADD
, instr_handler
},
2061 {BWRITERSIO_CMP
, instr_handler
},
2063 {BWRITERSIO_CALL
, instr_handler
},
2064 {BWRITERSIO_CALLNZ
, instr_handler
},
2065 {BWRITERSIO_REP
, instr_handler
},
2066 {BWRITERSIO_ENDREP
, instr_handler
},
2067 {BWRITERSIO_IF
, instr_handler
},
2068 {BWRITERSIO_LABEL
, instr_handler
},
2069 {BWRITERSIO_IFC
, instr_handler
},
2070 {BWRITERSIO_ELSE
, instr_handler
},
2071 {BWRITERSIO_ENDIF
, instr_handler
},
2072 {BWRITERSIO_BREAK
, instr_handler
},
2073 {BWRITERSIO_BREAKC
, instr_handler
},
2074 {BWRITERSIO_RET
, instr_handler
},
2076 {BWRITERSIO_TEX
, instr_handler
},
2077 {BWRITERSIO_TEXLDP
, instr_handler
},
2078 {BWRITERSIO_TEXLDB
, instr_handler
},
2079 {BWRITERSIO_TEXKILL
, instr_handler
},
2080 {BWRITERSIO_DSX
, instr_handler
},
2081 {BWRITERSIO_DSY
, instr_handler
},
2083 {BWRITERSIO_SETP
, instr_handler
},
2084 {BWRITERSIO_BREAKP
, instr_handler
},
2086 {BWRITERSIO_TEXLDD
, instr_handler
},
2088 {BWRITERSIO_END
, NULL
},
2091 static const struct bytecode_backend ps_2_x_backend
= {
2100 static void sm_3_header(struct bc_writer
*This
, const struct bwriter_shader
*shader
, struct bytecode_buffer
*buffer
) {
2101 write_declarations(This
, buffer
, TRUE
, shader
->inputs
, shader
->num_inputs
, BWRITERSPR_INPUT
);
2102 write_declarations(This
, buffer
, TRUE
, shader
->outputs
, shader
->num_outputs
, BWRITERSPR_OUTPUT
);
2103 write_constF(shader
, buffer
, TRUE
);
2104 write_constB(shader
, buffer
, TRUE
);
2105 write_constI(shader
, buffer
, TRUE
);
2106 write_samplers(shader
, buffer
);
2109 static void sm_3_srcreg(struct bc_writer
*This
,
2110 const struct shader_reg
*reg
,
2111 struct bytecode_buffer
*buffer
) {
2112 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
2115 d3d9reg
= d3d9_register(reg
->type
);
2116 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
2117 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
2118 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
;
2120 token
|= d3d9_swizzle(reg
->u
.swizzle
) & D3DVS_SWIZZLE_MASK
;
2121 token
|= d3d9_srcmod(reg
->srcmod
);
2124 if(reg
->type
== BWRITERSPR_CONST
&& This
->version
== BWRITERPS_VERSION(3, 0)) {
2125 WARN("c%u[...] is unsupported in ps_3_0\n", reg
->regnum
);
2126 This
->state
= E_INVALIDARG
;
2129 if(((reg
->rel_reg
->type
== BWRITERSPR_ADDR
&& This
->version
== BWRITERVS_VERSION(3, 0)) ||
2130 reg
->rel_reg
->type
== BWRITERSPR_LOOP
) &&
2131 reg
->rel_reg
->regnum
== 0) {
2132 token
|= D3DVS_ADDRMODE_RELATIVE
& D3DVS_ADDRESSMODE_MASK
;
2134 WARN("Unsupported relative addressing register\n");
2135 This
->state
= E_INVALIDARG
;
2140 put_dword(buffer
, token
);
2142 /* vs_2_0 and newer write the register containing the index explicitly in the
2145 if(token
& D3DVS_ADDRMODE_RELATIVE
) {
2146 sm_3_srcreg(This
, reg
->rel_reg
, buffer
);
2150 static void sm_3_dstreg(struct bc_writer
*This
,
2151 const struct shader_reg
*reg
,
2152 struct bytecode_buffer
*buffer
,
2153 DWORD shift
, DWORD mod
) {
2154 DWORD token
= (1 << 31); /* Bit 31 of registers is 1 */
2158 if(This
->version
== BWRITERVS_VERSION(3, 0) &&
2159 reg
->type
== BWRITERSPR_OUTPUT
) {
2160 token
|= D3DVS_ADDRMODE_RELATIVE
& D3DVS_ADDRESSMODE_MASK
;
2162 WARN("Relative addressing not supported for this shader type or register type\n");
2163 This
->state
= E_INVALIDARG
;
2168 d3d9reg
= d3d9_register(reg
->type
);
2169 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT
) & D3DSP_REGTYPE_MASK
;
2170 token
|= (d3d9reg
<< D3DSP_REGTYPE_SHIFT2
) & D3DSP_REGTYPE_MASK2
;
2171 token
|= reg
->regnum
& D3DSP_REGNUM_MASK
; /* No shift */
2173 token
|= d3d9_dstmod(mod
);
2175 token
|= d3d9_writemask(reg
->u
.writemask
);
2176 put_dword(buffer
, token
);
2178 /* vs_2_0 and newer write the register containing the index explicitly in the
2181 if(token
& D3DVS_ADDRMODE_RELATIVE
) {
2182 sm_3_srcreg(This
, reg
->rel_reg
, buffer
);
2186 static const struct instr_handler_table vs_3_handlers
[] = {
2187 {BWRITERSIO_ADD
, instr_handler
},
2188 {BWRITERSIO_NOP
, instr_handler
},
2189 {BWRITERSIO_MOV
, instr_handler
},
2190 {BWRITERSIO_SUB
, instr_handler
},
2191 {BWRITERSIO_MAD
, instr_handler
},
2192 {BWRITERSIO_MUL
, instr_handler
},
2193 {BWRITERSIO_RCP
, instr_handler
},
2194 {BWRITERSIO_RSQ
, instr_handler
},
2195 {BWRITERSIO_DP3
, instr_handler
},
2196 {BWRITERSIO_DP4
, instr_handler
},
2197 {BWRITERSIO_MIN
, instr_handler
},
2198 {BWRITERSIO_MAX
, instr_handler
},
2199 {BWRITERSIO_SLT
, instr_handler
},
2200 {BWRITERSIO_SGE
, instr_handler
},
2201 {BWRITERSIO_ABS
, instr_handler
},
2202 {BWRITERSIO_EXP
, instr_handler
},
2203 {BWRITERSIO_LOG
, instr_handler
},
2204 {BWRITERSIO_EXPP
, instr_handler
},
2205 {BWRITERSIO_LOGP
, instr_handler
},
2206 {BWRITERSIO_DST
, instr_handler
},
2207 {BWRITERSIO_LRP
, instr_handler
},
2208 {BWRITERSIO_FRC
, instr_handler
},
2209 {BWRITERSIO_CRS
, instr_handler
},
2210 {BWRITERSIO_SGN
, instr_handler
},
2211 {BWRITERSIO_NRM
, instr_handler
},
2212 {BWRITERSIO_SINCOS
, instr_handler
},
2213 {BWRITERSIO_M4x4
, instr_handler
},
2214 {BWRITERSIO_M4x3
, instr_handler
},
2215 {BWRITERSIO_M3x4
, instr_handler
},
2216 {BWRITERSIO_M3x3
, instr_handler
},
2217 {BWRITERSIO_M3x2
, instr_handler
},
2218 {BWRITERSIO_LIT
, instr_handler
},
2219 {BWRITERSIO_POW
, instr_handler
},
2220 {BWRITERSIO_MOVA
, instr_handler
},
2222 {BWRITERSIO_CALL
, instr_handler
},
2223 {BWRITERSIO_CALLNZ
, instr_handler
},
2224 {BWRITERSIO_REP
, instr_handler
},
2225 {BWRITERSIO_ENDREP
, instr_handler
},
2226 {BWRITERSIO_IF
, instr_handler
},
2227 {BWRITERSIO_LABEL
, instr_handler
},
2228 {BWRITERSIO_IFC
, instr_handler
},
2229 {BWRITERSIO_ELSE
, instr_handler
},
2230 {BWRITERSIO_ENDIF
, instr_handler
},
2231 {BWRITERSIO_BREAK
, instr_handler
},
2232 {BWRITERSIO_BREAKC
, instr_handler
},
2233 {BWRITERSIO_LOOP
, instr_handler
},
2234 {BWRITERSIO_RET
, instr_handler
},
2235 {BWRITERSIO_ENDLOOP
, instr_handler
},
2237 {BWRITERSIO_SETP
, instr_handler
},
2238 {BWRITERSIO_BREAKP
, instr_handler
},
2239 {BWRITERSIO_TEXLDL
, instr_handler
},
2241 {BWRITERSIO_END
, NULL
},
2244 static const struct bytecode_backend vs_3_backend
= {
2253 static const struct instr_handler_table ps_3_handlers
[] = {
2254 {BWRITERSIO_ADD
, instr_handler
},
2255 {BWRITERSIO_NOP
, instr_handler
},
2256 {BWRITERSIO_MOV
, instr_handler
},
2257 {BWRITERSIO_SUB
, instr_handler
},
2258 {BWRITERSIO_MAD
, instr_handler
},
2259 {BWRITERSIO_MUL
, instr_handler
},
2260 {BWRITERSIO_RCP
, instr_handler
},
2261 {BWRITERSIO_RSQ
, instr_handler
},
2262 {BWRITERSIO_DP3
, instr_handler
},
2263 {BWRITERSIO_DP4
, instr_handler
},
2264 {BWRITERSIO_MIN
, instr_handler
},
2265 {BWRITERSIO_MAX
, instr_handler
},
2266 {BWRITERSIO_ABS
, instr_handler
},
2267 {BWRITERSIO_EXP
, instr_handler
},
2268 {BWRITERSIO_LOG
, instr_handler
},
2269 {BWRITERSIO_EXPP
, instr_handler
},
2270 {BWRITERSIO_LOGP
, instr_handler
},
2271 {BWRITERSIO_LRP
, instr_handler
},
2272 {BWRITERSIO_FRC
, instr_handler
},
2273 {BWRITERSIO_CRS
, instr_handler
},
2274 {BWRITERSIO_NRM
, instr_handler
},
2275 {BWRITERSIO_SINCOS
, instr_handler
},
2276 {BWRITERSIO_M4x4
, instr_handler
},
2277 {BWRITERSIO_M4x3
, instr_handler
},
2278 {BWRITERSIO_M3x4
, instr_handler
},
2279 {BWRITERSIO_M3x3
, instr_handler
},
2280 {BWRITERSIO_M3x2
, instr_handler
},
2281 {BWRITERSIO_POW
, instr_handler
},
2282 {BWRITERSIO_DP2ADD
, instr_handler
},
2283 {BWRITERSIO_CMP
, instr_handler
},
2285 {BWRITERSIO_CALL
, instr_handler
},
2286 {BWRITERSIO_CALLNZ
, instr_handler
},
2287 {BWRITERSIO_REP
, instr_handler
},
2288 {BWRITERSIO_ENDREP
, instr_handler
},
2289 {BWRITERSIO_IF
, instr_handler
},
2290 {BWRITERSIO_LABEL
, instr_handler
},
2291 {BWRITERSIO_IFC
, instr_handler
},
2292 {BWRITERSIO_ELSE
, instr_handler
},
2293 {BWRITERSIO_ENDIF
, instr_handler
},
2294 {BWRITERSIO_BREAK
, instr_handler
},
2295 {BWRITERSIO_BREAKC
, instr_handler
},
2296 {BWRITERSIO_LOOP
, instr_handler
},
2297 {BWRITERSIO_RET
, instr_handler
},
2298 {BWRITERSIO_ENDLOOP
, instr_handler
},
2300 {BWRITERSIO_SETP
, instr_handler
},
2301 {BWRITERSIO_BREAKP
, instr_handler
},
2302 {BWRITERSIO_TEXLDL
, instr_handler
},
2304 {BWRITERSIO_TEX
, instr_handler
},
2305 {BWRITERSIO_TEXLDP
, instr_handler
},
2306 {BWRITERSIO_TEXLDB
, instr_handler
},
2307 {BWRITERSIO_TEXKILL
, instr_handler
},
2308 {BWRITERSIO_DSX
, instr_handler
},
2309 {BWRITERSIO_DSY
, instr_handler
},
2310 {BWRITERSIO_TEXLDD
, instr_handler
},
2312 {BWRITERSIO_END
, NULL
},
2315 static const struct bytecode_backend ps_3_backend
= {
2324 static void init_vs10_dx9_writer(struct bc_writer
*writer
) {
2325 TRACE("Creating DirectX9 vertex shader 1.0 writer\n");
2326 writer
->funcs
= &vs_1_x_backend
;
2329 static void init_vs11_dx9_writer(struct bc_writer
*writer
) {
2330 TRACE("Creating DirectX9 vertex shader 1.1 writer\n");
2331 writer
->funcs
= &vs_1_x_backend
;
2334 static void init_vs20_dx9_writer(struct bc_writer
*writer
) {
2335 TRACE("Creating DirectX9 vertex shader 2.0 writer\n");
2336 writer
->funcs
= &vs_2_0_backend
;
2339 static void init_vs2x_dx9_writer(struct bc_writer
*writer
) {
2340 TRACE("Creating DirectX9 vertex shader 2.x writer\n");
2341 writer
->funcs
= &vs_2_x_backend
;
2344 static void init_vs30_dx9_writer(struct bc_writer
*writer
) {
2345 TRACE("Creating DirectX9 vertex shader 3.0 writer\n");
2346 writer
->funcs
= &vs_3_backend
;
2349 static void init_ps10_dx9_writer(struct bc_writer
*writer
) {
2350 TRACE("Creating DirectX9 pixel shader 1.0 writer\n");
2351 writer
->funcs
= &ps_1_0123_backend
;
2354 static void init_ps11_dx9_writer(struct bc_writer
*writer
) {
2355 TRACE("Creating DirectX9 pixel shader 1.1 writer\n");
2356 writer
->funcs
= &ps_1_0123_backend
;
2359 static void init_ps12_dx9_writer(struct bc_writer
*writer
) {
2360 TRACE("Creating DirectX9 pixel shader 1.2 writer\n");
2361 writer
->funcs
= &ps_1_0123_backend
;
2364 static void init_ps13_dx9_writer(struct bc_writer
*writer
) {
2365 TRACE("Creating DirectX9 pixel shader 1.3 writer\n");
2366 writer
->funcs
= &ps_1_0123_backend
;
2369 static void init_ps14_dx9_writer(struct bc_writer
*writer
) {
2370 TRACE("Creating DirectX9 pixel shader 1.4 writer\n");
2371 writer
->funcs
= &ps_1_4_backend
;
2374 static void init_ps20_dx9_writer(struct bc_writer
*writer
) {
2375 TRACE("Creating DirectX9 pixel shader 2.0 writer\n");
2376 writer
->funcs
= &ps_2_0_backend
;
2379 static void init_ps2x_dx9_writer(struct bc_writer
*writer
) {
2380 TRACE("Creating DirectX9 pixel shader 2.x writer\n");
2381 writer
->funcs
= &ps_2_x_backend
;
2384 static void init_ps30_dx9_writer(struct bc_writer
*writer
) {
2385 TRACE("Creating DirectX9 pixel shader 3.0 writer\n");
2386 writer
->funcs
= &ps_3_backend
;
2389 static struct bc_writer
*create_writer(DWORD version
, DWORD dxversion
) {
2390 struct bc_writer
*ret
= d3dcompiler_alloc(sizeof(*ret
));
2393 WARN("Failed to allocate a bytecode writer instance\n");
2398 case BWRITERVS_VERSION(1, 0):
2399 if(dxversion
!= 9) {
2400 WARN("Unsupported dxversion for vertex shader 1.0 requested: %u\n", dxversion
);
2403 init_vs10_dx9_writer(ret
);
2405 case BWRITERVS_VERSION(1, 1):
2406 if(dxversion
!= 9) {
2407 WARN("Unsupported dxversion for vertex shader 1.1 requested: %u\n", dxversion
);
2410 init_vs11_dx9_writer(ret
);
2412 case BWRITERVS_VERSION(2, 0):
2413 if(dxversion
!= 9) {
2414 WARN("Unsupported dxversion for vertex shader 2.0 requested: %u\n", dxversion
);
2417 init_vs20_dx9_writer(ret
);
2419 case BWRITERVS_VERSION(2, 1):
2420 if(dxversion
!= 9) {
2421 WARN("Unsupported dxversion for vertex shader 2.x requested: %u\n", dxversion
);
2424 init_vs2x_dx9_writer(ret
);
2426 case BWRITERVS_VERSION(3, 0):
2427 if(dxversion
!= 9) {
2428 WARN("Unsupported dxversion for vertex shader 3.0 requested: %u\n", dxversion
);
2431 init_vs30_dx9_writer(ret
);
2434 case BWRITERPS_VERSION(1, 0):
2435 if(dxversion
!= 9) {
2436 WARN("Unsupported dxversion for pixel shader 1.0 requested: %u\n", dxversion
);
2439 init_ps10_dx9_writer(ret
);
2441 case BWRITERPS_VERSION(1, 1):
2442 if(dxversion
!= 9) {
2443 WARN("Unsupported dxversion for pixel shader 1.1 requested: %u\n", dxversion
);
2446 init_ps11_dx9_writer(ret
);
2448 case BWRITERPS_VERSION(1, 2):
2449 if(dxversion
!= 9) {
2450 WARN("Unsupported dxversion for pixel shader 1.2 requested: %u\n", dxversion
);
2453 init_ps12_dx9_writer(ret
);
2455 case BWRITERPS_VERSION(1, 3):
2456 if(dxversion
!= 9) {
2457 WARN("Unsupported dxversion for pixel shader 1.3 requested: %u\n", dxversion
);
2460 init_ps13_dx9_writer(ret
);
2462 case BWRITERPS_VERSION(1, 4):
2463 if(dxversion
!= 9) {
2464 WARN("Unsupported dxversion for pixel shader 1.4 requested: %u\n", dxversion
);
2467 init_ps14_dx9_writer(ret
);
2470 case BWRITERPS_VERSION(2, 0):
2471 if(dxversion
!= 9) {
2472 WARN("Unsupported dxversion for pixel shader 2.0 requested: %u\n", dxversion
);
2475 init_ps20_dx9_writer(ret
);
2478 case BWRITERPS_VERSION(2, 1):
2479 if(dxversion
!= 9) {
2480 WARN("Unsupported dxversion for pixel shader 2.x requested: %u\n", dxversion
);
2483 init_ps2x_dx9_writer(ret
);
2486 case BWRITERPS_VERSION(3, 0):
2487 if(dxversion
!= 9) {
2488 WARN("Unsupported dxversion for pixel shader 3.0 requested: %u\n", dxversion
);
2491 init_ps30_dx9_writer(ret
);
2495 WARN("Unexpected shader version requested: %08x\n", version
);
2498 ret
->version
= version
;
2502 d3dcompiler_free(ret
);
2506 static HRESULT
call_instr_handler(struct bc_writer
*writer
,
2507 const struct instruction
*instr
,
2508 struct bytecode_buffer
*buffer
) {
2511 while(writer
->funcs
->instructions
[i
].opcode
!= BWRITERSIO_END
) {
2512 if(instr
->opcode
== writer
->funcs
->instructions
[i
].opcode
) {
2513 if(!writer
->funcs
->instructions
[i
].func
) {
2514 WARN("Opcode %u not supported by this profile\n", instr
->opcode
);
2515 return E_INVALIDARG
;
2517 writer
->funcs
->instructions
[i
].func(writer
, instr
, buffer
);
2523 FIXME("Unhandled instruction %u - %s\n", instr
->opcode
,
2524 debug_print_opcode(instr
->opcode
));
2525 return E_INVALIDARG
;
2528 HRESULT
SlWriteBytecode(const struct bwriter_shader
*shader
, int dxversion
, DWORD
**result
, DWORD
*size
)
2530 struct bc_writer
*writer
;
2531 struct bytecode_buffer
*buffer
= NULL
;
2536 ERR("NULL shader structure, aborting\n");
2539 writer
= create_writer(shader
->version
, dxversion
);
2543 WARN("Could not create a bytecode writer instance. Either unsupported version\n");
2544 WARN("or out of memory\n");
2549 buffer
= allocate_buffer();
2551 WARN("Failed to allocate a buffer for the shader bytecode\n");
2556 /* Write shader type and version */
2557 put_dword(buffer
, shader
->version
);
2559 writer
->funcs
->header(writer
, shader
, buffer
);
2560 if(FAILED(writer
->state
)) {
2565 for(i
= 0; i
< shader
->num_instrs
; i
++) {
2566 hr
= call_instr_handler(writer
, shader
->instr
[i
], buffer
);
2572 if(FAILED(writer
->state
)) {
2577 writer
->funcs
->end(writer
, shader
, buffer
);
2579 if(FAILED(buffer
->state
)) {
2584 *size
= buffer
->size
* sizeof(DWORD
);
2585 *result
= buffer
->data
;
2586 buffer
->data
= NULL
;
2591 d3dcompiler_free(buffer
->data
);
2592 d3dcompiler_free(buffer
);
2594 d3dcompiler_free(writer
);
2598 void SlDeleteShader(struct bwriter_shader
*shader
) {
2601 TRACE("Deleting shader %p\n", shader
);
2603 for(i
= 0; i
< shader
->num_cf
; i
++) {
2604 d3dcompiler_free(shader
->constF
[i
]);
2606 d3dcompiler_free(shader
->constF
);
2607 for(i
= 0; i
< shader
->num_ci
; i
++) {
2608 d3dcompiler_free(shader
->constI
[i
]);
2610 d3dcompiler_free(shader
->constI
);
2611 for(i
= 0; i
< shader
->num_cb
; i
++) {
2612 d3dcompiler_free(shader
->constB
[i
]);
2614 d3dcompiler_free(shader
->constB
);
2616 d3dcompiler_free(shader
->inputs
);
2617 d3dcompiler_free(shader
->outputs
);
2618 d3dcompiler_free(shader
->samplers
);
2620 for(i
= 0; i
< shader
->num_instrs
; i
++) {
2621 for(j
= 0; j
< shader
->instr
[i
]->num_srcs
; j
++) {
2622 d3dcompiler_free(shader
->instr
[i
]->src
[j
].rel_reg
);
2624 d3dcompiler_free(shader
->instr
[i
]->src
);
2625 d3dcompiler_free(shader
->instr
[i
]);
2627 d3dcompiler_free(shader
->instr
);
2629 d3dcompiler_free(shader
);