/**************************************************************************
 *
 * Copyright 2007 Tungsten Graphics, Inc., Cedar Park, Texas.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
/*
 * Keith Whitwell <keith@tungstengraphics.com>
 */
#include "util/u_math.h"
#include "util/u_memory.h"

#include "pipe/p_shader_tokens.h"

#include "draw_private.h"
#include "draw_context.h"

#include "translate/translate.h"
#include "translate/translate_cache.h"

#include "tgsi/tgsi_dump.h"
#include "tgsi/tgsi_exec.h"
49 DEBUG_GET_ONCE_BOOL_OPTION(gallium_dump_vs
, "GALLIUM_DUMP_VS", FALSE
)
53 * Set a vertex shader constant buffer.
54 * \param slot which constant buffer in [0, PIPE_MAX_CONSTANT_BUFFERS-1]
55 * \param constants the mapped buffer
56 * \param size size of buffer in bytes
59 draw_vs_set_constants(struct draw_context
*draw
,
61 const void *constants
,
64 const int alignment
= 16;
66 /* check if buffer is 16-byte aligned */
67 if (((uintptr_t)constants
) & (alignment
- 1)) {
68 /* if not, copy the constants into a new, 16-byte aligned buffer */
69 if (size
> draw
->vs
.const_storage_size
[slot
]) {
70 if (draw
->vs
.aligned_constant_storage
[slot
]) {
71 align_free((void *)draw
->vs
.aligned_constant_storage
[slot
]);
73 draw
->vs
.aligned_constant_storage
[slot
] =
74 align_malloc(size
, alignment
);
77 memcpy((void *)draw
->vs
.aligned_constant_storage
[slot
],
80 constants
= draw
->vs
.aligned_constant_storage
[slot
];
83 draw
->vs
.aligned_constants
[slot
] = constants
;
84 draw_vs_aos_machine_constants(draw
->vs
.aos_machine
, slot
, constants
);
88 void draw_vs_set_viewport( struct draw_context
*draw
,
89 const struct pipe_viewport_state
*viewport
)
91 draw_vs_aos_machine_viewport( draw
->vs
.aos_machine
, viewport
);
96 struct draw_vertex_shader
*
97 draw_create_vertex_shader(struct draw_context
*draw
,
98 const struct pipe_shader_state
*shader
)
100 struct draw_vertex_shader
*vs
= NULL
;
103 tgsi_dump(shader
->tokens
, 0);
106 if (!draw
->pt
.middle
.llvm
) {
108 /* these paths don't support vertex clamping
109 * TODO: either add it, or remove them completely
110 * use LLVM instead if you want performance
111 * use exec instead if you want debugging/more correctness
113 #if defined(PIPE_ARCH_X86)
114 vs
= draw_create_vs_sse( draw
, shader
);
115 #elif defined(PIPE_ARCH_PPC)
116 vs
= draw_create_vs_ppc( draw
, shader
);
122 vs
= draw_create_vs_llvm(draw
, shader
);
127 vs
= draw_create_vs_exec( draw
, shader
);
133 for (i
= 0; i
< vs
->info
.num_outputs
; i
++) {
134 if (vs
->info
.output_semantic_name
[i
] == TGSI_SEMANTIC_POSITION
&&
135 vs
->info
.output_semantic_index
[i
] == 0)
136 vs
->position_output
= i
;
137 else if (vs
->info
.output_semantic_name
[i
] == TGSI_SEMANTIC_EDGEFLAG
&&
138 vs
->info
.output_semantic_index
[i
] == 0)
139 vs
->edgeflag_output
= i
;
149 draw_bind_vertex_shader(struct draw_context
*draw
,
150 struct draw_vertex_shader
*dvs
)
152 draw_do_flush( draw
, DRAW_FLUSH_STATE_CHANGE
);
156 draw
->vs
.vertex_shader
= dvs
;
157 draw
->vs
.num_vs_outputs
= dvs
->info
.num_outputs
;
158 draw
->vs
.position_output
= dvs
->position_output
;
159 draw
->vs
.edgeflag_output
= dvs
->edgeflag_output
;
160 dvs
->prepare( dvs
, draw
);
163 draw
->vs
.vertex_shader
= NULL
;
164 draw
->vs
.num_vs_outputs
= 0;
170 draw_delete_vertex_shader(struct draw_context
*draw
,
171 struct draw_vertex_shader
*dvs
)
175 for (i
= 0; i
< dvs
->nr_variants
; i
++)
176 dvs
->variant
[i
]->destroy( dvs
->variant
[i
] );
178 dvs
->nr_variants
= 0;
186 draw_vs_init( struct draw_context
*draw
)
188 draw
->dump_vs
= debug_get_option_gallium_dump_vs();
190 draw
->vs
.machine
= tgsi_exec_machine_create();
191 if (!draw
->vs
.machine
)
194 draw
->vs
.emit_cache
= translate_cache_create();
195 if (!draw
->vs
.emit_cache
)
198 draw
->vs
.fetch_cache
= translate_cache_create();
199 if (!draw
->vs
.fetch_cache
)
202 draw
->vs
.aos_machine
= draw_vs_aos_machine();
204 if (!draw
->vs
.aos_machine
)
212 draw_vs_destroy( struct draw_context
*draw
)
216 if (draw
->vs
.fetch_cache
)
217 translate_cache_destroy(draw
->vs
.fetch_cache
);
219 if (draw
->vs
.emit_cache
)
220 translate_cache_destroy(draw
->vs
.emit_cache
);
222 if (draw
->vs
.aos_machine
)
223 draw_vs_aos_machine_destroy(draw
->vs
.aos_machine
);
225 for (i
= 0; i
< PIPE_MAX_CONSTANT_BUFFERS
; i
++) {
226 if (draw
->vs
.aligned_constant_storage
[i
]) {
227 align_free((void *)draw
->vs
.aligned_constant_storage
[i
]);
231 tgsi_exec_machine_destroy(draw
->vs
.machine
);
235 struct draw_vs_variant
*
236 draw_vs_lookup_variant( struct draw_vertex_shader
*vs
,
237 const struct draw_vs_variant_key
*key
)
239 struct draw_vs_variant
*variant
;
242 /* Lookup existing variant:
244 for (i
= 0; i
< vs
->nr_variants
; i
++)
245 if (draw_vs_variant_key_compare(key
, &vs
->variant
[i
]->key
) == 0)
246 return vs
->variant
[i
];
248 /* Else have to create a new one:
250 variant
= vs
->create_variant( vs
, key
);
254 /* Add it to our list, could be smarter:
256 if (vs
->nr_variants
< Elements(vs
->variant
)) {
257 vs
->variant
[vs
->nr_variants
++] = variant
;
261 vs
->last_variant
%= Elements(vs
->variant
);
262 vs
->variant
[vs
->last_variant
]->destroy(vs
->variant
[vs
->last_variant
]);
263 vs
->variant
[vs
->last_variant
] = variant
;
273 draw_vs_get_fetch( struct draw_context
*draw
,
274 struct translate_key
*key
)
276 if (!draw
->vs
.fetch
||
277 translate_key_compare(&draw
->vs
.fetch
->key
, key
) != 0)
279 translate_key_sanitize(key
);
280 draw
->vs
.fetch
= translate_cache_find(draw
->vs
.fetch_cache
, key
);
283 return draw
->vs
.fetch
;
287 draw_vs_get_emit( struct draw_context
*draw
,
288 struct translate_key
*key
)
290 if (!draw
->vs
.emit
||
291 translate_key_compare(&draw
->vs
.emit
->key
, key
) != 0)
293 translate_key_sanitize(key
);
294 draw
->vs
.emit
= translate_cache_find(draw
->vs
.emit_cache
, key
);
297 return draw
->vs
.emit
;