1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 **********************************************************/
26 #include "util/u_inlines.h"
27 #include "pipe/p_defines.h"
28 #include "util/u_format.h"
29 #include "util/u_math.h"
30 #include "util/u_bitmask.h"
31 #include "translate/translate.h"
33 #include "svga_context.h"
34 #include "svga_state.h"
36 #include "svga_tgsi.h"
38 #include "svga_hw_reg.h"
40 /***********************************************************************
// Byte-wise comparison of two vertex-shader compile keys.
// The number of bytes compared is svga_vs_key_size(a); the memcmp() result
// is returned as-is, so 0 means the first `keysize` bytes of both keys match.
// NOTE(review): the length is derived from `a` only - confirm that callers
// never compare keys whose sizes differ.
44 static INLINE int compare_vs_keys( const struct svga_vs_compile_key *a,
45 const struct svga_vs_compile_key *b )
47 unsigned keysize = svga_vs_key_size( a );
48 return memcmp( a, b, keysize );
// Search the results already compiled for `vs` for one built with `key`.
// Walks the singly linked list that starts at vs->base.results and follows
// result->next, comparing each entry's key.vkey with compare_vs_keys().
// NOTE(review): the return statements are not visible here - presumably the
// matching entry on a hit and NULL once the list is exhausted; confirm.
52 static struct svga_shader_result *search_vs_key( struct svga_vertex_shader *vs,
53 const struct svga_vs_compile_key *key )
55 struct svga_shader_result *result = vs->base.results;
// A compare result of 0 means the stored key matches the requested one.
59 for ( ; result; result = result->next) {
60 if (compare_vs_keys( key, &result->key.vkey ) == 0)
// Translate `vs` for the given compile key, define the resulting shader via
// SVGA3D_DefineShader and link it into the shader's list of results.
//   svga       - context; supplies the shader-id bitmask (vs_bm) and the
//                command channel (swc).
//   vs         - shader to translate; the new result is pushed onto
//                vs->base.results.
//   key        - variant key handed to svga_translate_vertex_program().
//   out_result - NOTE(review): presumably receives the new result on
//                success; the store is not visible here - confirm.
// Returns an enum pipe_error. `ret` starts as PIPE_ERROR and is overwritten
// by the steps below.
68 static enum pipe_error compile_vs( struct svga_context *svga,
69 struct svga_vertex_shader *vs,
70 const struct svga_vs_compile_key *key,
71 struct svga_shader_result **out_result )
73 struct svga_shader_result *result;
74 enum pipe_error ret = PIPE_ERROR;
76 result = svga_translate_vertex_program( vs, key );
// NOTE(review): the guard around this assignment is not visible - presumably
// it is taken when translation produced no result; confirm.
78 ret = PIPE_ERROR_OUT_OF_MEMORY;
// Reserve a shader id from the context's vertex-shader bitmask; running out
// of ids is reported as out-of-memory.
82 result->id = util_bitmask_add(svga->vs_bm);
83 if(result->id == UTIL_BITMASK_INVALID_INDEX) {
84 ret = PIPE_ERROR_OUT_OF_MEMORY;
// The last argument is the token stream size in bytes: token count times the
// size of one token.
88 ret = SVGA3D_DefineShader(svga->swc,
92 result->nr_tokens * sizeof result->tokens[0]);
// Push the new result onto the head of the shader's result list.
97 result->next = vs->base.results;
98 vs->base.results = result;
// Cleanup: hand the id back to the bitmask if one was reserved, then destroy
// the result. NOTE(review): presumably this is the failure path; its label
// and any guard on `result` are not visible here - confirm.
103 if (result->id != UTIL_BITMASK_INVALID_INDEX)
104 util_bitmask_clear( svga->vs_bm, result->id );
105 svga_destroy_shader_result( result );
// Fill *key with the context state that selects a vertex-shader variant.
// The whole struct is zeroed first, so every byte not explicitly assigned
// below is 0; this matters because keys are compared with memcmp() in
// compare_vs_keys().
// Fields copied from the context:
//   need_prescale                   <- state.hw_clear.prescale.enabled
//   allow_psiz                      <- curr.rast->templ.point_size_per_vertex
//   zero_stride_vertex_elements     <- curr.zero_stride_vertex_elements
//   num_zero_stride_vertex_elements <- curr.num_zero_stride_vertex_elements
// NOTE(review): the return statement is not visible here; the caller treats
// a non-zero value as an error - confirm.
110 /* SVGA_NEW_PRESCALE, SVGA_NEW_RAST, SVGA_NEW_ZERO_STRIDE
112 static int make_vs_key( struct svga_context *svga,
113 struct svga_vs_compile_key *key )
115 memset(key, 0, sizeof *key);
116 key->need_prescale = svga->state.hw_clear.prescale.enabled;
117 key->allow_psiz = svga->curr.rast->templ.point_size_per_vertex;
118 key->zero_stride_vertex_elements =
119 svga->curr.zero_stride_vertex_elements;
120 key->num_zero_stride_vertex_elements =
121 svga->curr.num_zero_stride_vertex_elements;
// Select the vertex-shader variant that matches the current state and bind
// it with SVGA3D_SetShader when it differs from the one recorded in
// svga->state.hw_draw.vs.
// When state.sw.need_swtnl is set the lookup is skipped, so `result` stays
// NULL and `id` keeps its initial SVGA3D_INVALID_ID value.
// NOTE(review): the second parameter, the declaration of `ret`, the error
// checks after each call and the final return are not visible here.
127 static int emit_hw_vs( struct svga_context *svga,
130 struct svga_shader_result *result = NULL;
131 unsigned id = SVGA3D_INVALID_ID;
134 /* SVGA_NEW_NEED_SWTNL */
135 if (!svga->state.sw.need_swtnl) {
136 struct svga_vertex_shader *vs = svga->curr.vs;
137 struct svga_vs_compile_key key;
// Build the variant key from the current context state.
139 ret = make_vs_key( svga, &key );
// Reuse an existing result for this key if there is one.
// NOTE(review): presumably compile_vs() runs only when the search found
// nothing, and `id` is then taken from the result; neither the guard nor the
// assignment is visible here - confirm.
143 result = search_vs_key( vs, &key );
145 ret = compile_vs( svga, vs, &key, &result );
// Only issue the command when the bound variant actually changes.
154 if (result != svga->state.hw_draw.vs) {
155 ret = SVGA3D_SetShader(svga->swc,
156 SVGA3D_SHADERTYPE_VS,
// Flag the change in svga->dirty and remember what is now bound.
161 svga->dirty |= SVGA_NEW_VS_RESULT;
162 svga->state.hw_draw.vs = result;
// Tracked-state entry labelled "vertex shader (hwtnl)".
// The visible part of its flag mask contains SVGA_NEW_NEED_SWTNL and
// SVGA_NEW_ZERO_STRIDE.
// NOTE(review): the start of the mask and the remaining member(s) are not
// visible here - presumably the entry ends with the emit_hw_vs callback;
// confirm against the full initializer.
168 struct svga_tracked_state svga_hw_vs =
170 "vertex shader (hwtnl)",
173 SVGA_NEW_NEED_SWTNL |
174 SVGA_NEW_ZERO_STRIDE),
179 /***********************************************************************
// Recompute which vertex elements read from a vertex buffer with stride 0.
// For every such element its value is converted to four 32-bit floats and
// written into svga->curr.zero_stride_constants, and the element is recorded
// in the zero_stride_vertex_elements bitmask and counted.
// SVGA_NEW_ZERO_STRIDE is raised in svga->dirty when at least one such
// element was found.
// NOTE(review): the second parameter, the declarations of `i`, `const_idx`
// and `mapped_buffer`, some call arguments and the return are not visible
// here.
181 static int update_zero_stride( struct svga_context *svga,
// Start from a clean slate; both fields are rebuilt by the loop below.
186 svga->curr.zero_stride_vertex_elements = 0;
187 svga->curr.num_zero_stride_vertex_elements = 0;
189 for (i = 0; i < svga->curr.velems->count; i++) {
190 const struct pipe_vertex_element *vel = &svga->curr.velems->velem[i];
191 const struct pipe_vertex_buffer *vbuffer = &svga->curr.vb[
192 vel->vertex_buffer_index];
194 if (vbuffer->stride == 0) {
// NOTE(review): presumably the initializer of const_idx, i.e. the slot index
// is the number of zero-stride elements found so far; the declaration line
// is not visible - confirm.
196 svga->curr.num_zero_stride_vertex_elements;
197 struct pipe_transfer *transfer;
198 struct translate *translate;
199 struct translate_key key;
// Record element i in the bitmask and bump the count.
// NOTE(review): (1 << i) is a shift of a signed int - confirm that
// velems->count can never reach 31 or more.
202 svga->curr.zero_stride_vertex_elements |= (1 << i);
203 ++svga->curr.num_zero_stride_vertex_elements;
// Describe a translation of this one element into a 4-float slot
// (R32G32B32A32_FLOAT, 4 * sizeof(float) bytes) located at slot const_idx
// of the destination.
205 key.output_stride = 4 * sizeof(float);
207 key.element[0].type = TRANSLATE_ELEMENT_NORMAL;
208 key.element[0].input_format = vel->src_format;
209 key.element[0].output_format = PIPE_FORMAT_R32G32B32A32_FLOAT;
210 key.element[0].input_buffer = vel->vertex_buffer_index;
211 key.element[0].input_offset = vel->src_offset;
212 key.element[0].instance_divisor = vel->instance_divisor;
213 key.element[0].output_offset = const_idx * 4 * sizeof(float);
215 translate_key_sanitize(&key);
216 /* translate_generic_create is technically private but
217 * we don't want to code-generate, just want generic
219 translate = translate_generic_create(&key);
// NOTE(review): no NULL check on `translate` or on the mapped pointer is
// visible here before they are used - confirm against the full file.
221 assert(vel->src_offset == 0);
// The mapped length is the block size of the source format.
223 mapped_buffer = pipe_buffer_map_range(&svga->pipe,
226 util_format_get_blocksize(vel->src_format),
230 translate->set_buffer(translate, vel->vertex_buffer_index,
232 vbuffer->stride, ~0);
// NOTE(review): the arguments 0, 1, 0 presumably mean start 0, count 1,
// instance 0 - confirm against the translate interface.
233 translate->run(translate, 0, 1, 0,
234 svga->curr.zero_stride_constants);
// Release the mapping and the translate object created for this element.
236 pipe_buffer_unmap(&svga->pipe, transfer);
238 translate->release(translate);
// Raise the dirty flag only when at least one zero-stride element exists.
242 if (svga->curr.num_zero_stride_vertex_elements)
243 svga->dirty |= SVGA_NEW_ZERO_STRIDE;
248 struct svga_tracked_state svga_hw_update_zero_stride =
250 "update zero_stride",
251 ( SVGA_NEW_VELEMENT |