2 * Copyright 2008 Corbin Simpson <MostAwesomeDude@gmail.com>
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
23 #ifndef R300_CONTEXT_H
24 #define R300_CONTEXT_H
26 #include "draw/draw_vertex.h"
28 #include "util/u_blitter.h"
30 #include "pipe/p_context.h"
31 #include "util/u_inlines.h"
32 #include "util/u_transfer.h"
33 #include "util/u_vbuf_mgr.h"
35 #include "r300_defines.h"
36 #include "r300_screen.h"
40 struct r300_fragment_shader;
41 struct r300_vertex_shader;
42 struct r300_stencilref_context;
45 /* Name, for debugging. */
49 /* Emit the state to the context. */
50 void (*emit)(struct r300_context*, unsigned, void*);
51 /* Upper bound on number of dwords to emit. */
53 /* Whether this atom should be emitted. */
55 /* Whether this atom may be emitted with state == NULL. */
56 boolean allow_null_state;
/* Anti-aliasing state.
 * NOTE(review): dest is presumably the surface an MSAA resolve writes to and
 * aaresolve_ctl the matching resolve-control register value -- confirm.
 * Only part of this struct is visible in this excerpt. */
59 struct r300_aa_state {
60 struct r300_surface *dest;
63 uint32_t aaresolve_ctl;
/* Blend state.
 * NOTE(review): by analogy with r300_dsa_state::cb_no_readwrite this looks
 * like a pre-built command buffer used when colorbuffer reads and writes are
 * disabled -- confirm against the emit code. */
66 struct r300_blend_state {
68 uint32_t cb_no_readwrite[8];
71 struct r300_blend_color_state {
/* User clip plane state. */
75 struct r300_clip_state {
/* The Gallium clip state this object wraps. */
76 struct pipe_clip_state clip;
/* Depth, stencil, and alpha state: the Gallium state object together with
 * the register values and command buffers kept alongside it. */
81 struct r300_dsa_state {
/* Gallium depth/stencil/alpha state. */
82 struct pipe_depth_stencil_alpha_state dsa;
84 /* This is actually a command buffer with named dwords.
 * NOTE(review): because the members double as a command buffer, their
 * order and spacing presumably must not change -- confirm before editing. */
86 uint32_t alpha_function; /* R300_FG_ALPHA_FUNC: 0x4bd4 */
88 uint32_t z_buffer_control; /* R300_ZB_CNTL: 0x4f00 */
89 uint32_t z_stencil_control; /* R300_ZB_ZSTENCILCNTL: 0x4f04 */
90 uint32_t stencil_ref_mask; /* R300_ZB_STENCILREFMASK: 0x4f08 */
92 uint32_t stencil_ref_bf; /* R500_ZB_STENCILREFMASK_BF: 0x4fd4 */
94 /* The second command buffer disables zbuffer reads and writes. */
95 uint32_t cb_no_readwrite[8];
97 /* Whether a two-sided stencil is enabled. */
99 /* Whether a fallback should be used for a two-sided stencil ref value. */
100 boolean two_sided_stencil_ref;
/* HyperZ state (various SC/ZB bits). */
103 struct r300_hyperz_state {
104 int current_func; /* -1 after a clear before first op */
106 /* This is actually a command buffer with named dwords.
 * NOTE(review): member order presumably mirrors the emitted dword order --
 * confirm before reordering. */
107 uint32_t cb_flush_begin;
108 uint32_t zb_zcache_ctlstat; /* R300_ZB_CACHE_CNTL */
110 uint32_t zb_bw_cntl; /* R300_ZB_BW_CNTL */
112 uint32_t zb_depthclearvalue; /* R300_ZB_DEPTHCLEARVALUE */
114 uint32_t sc_hyperz; /* R300_SC_HYPERZ */
116 uint32_t gb_z_peq_config; /* R300_GB_Z_PEQ_CONFIG: 0x4028 */
/* GPU flush state.
 * NOTE(review): the cb_ prefix is used for command buffers elsewhere in this
 * file, so cb_flush_clean is presumably a six-dword command buffer --
 * confirm. */
119 struct r300_gpu_flush {
120 uint32_t cb_flush_clean[6];
123 #define RS_STATE_MAIN_SIZE 23
/* Rasterizer state: two copies of the Gallium rasterizer state plus the
 * command buffers and register values kept with them. */
125 struct r300_rs_state {
126 /* Original rasterizer state. */
127 struct pipe_rasterizer_state rs;
128 /* Draw-specific rasterizer state. */
129 struct pipe_rasterizer_state rs_draw;
131 /* Command buffers. cb_main holds RS_STATE_MAIN_SIZE dwords.
 * NOTE(review): the zb16/zb24 variants presumably carry the polygon offset
 * setup for 16-bit and 24-bit zbuffers respectively -- confirm. */
132 uint32_t cb_main[RS_STATE_MAIN_SIZE];
133 uint32_t cb_poly_offset_zb16[5];
134 uint32_t cb_poly_offset_zb24[5];
136 /* The index to cb_main where the cull_mode register value resides. */
137 unsigned cull_mode_index;
139 /* Whether polygon offset is enabled. */
140 boolean polygon_offset_enable;
142 /* This is emitted in the draw function. */
143 uint32_t color_control; /* R300_GA_COLOR_CONTROL: 0x4278 */
/* RS block state + VAP (vertex shader) output mapping state.
 * Each member holds the value of the register named in its comment. */
146 struct r300_rs_block {
147 uint32_t vap_vtx_state_cntl; /* R300_VAP_VTX_STATE_CNTL: 0x2180 */
148 uint32_t vap_vsm_vtx_assm; /* R300_VAP_VSM_VTX_ASSM: 0x2184 */
149 uint32_t vap_out_vtx_fmt[2]; /* R300_VAP_OUTPUT_VTX_FMT_[0-1]: 0x2090 */
152 uint32_t ip[8]; /* R300_RS_IP_[0-7], R500_RS_IP_[0-7] */
153 uint32_t count; /* R300_RS_COUNT */
154 uint32_t inst_count; /* R300_RS_INST_COUNT */
155 uint32_t inst[8]; /* R300_RS_INST_[0-7] */
/* Sampler state: the Gallium sampler state plus the texture filter register
 * values and the LOD range kept with it. */
158 struct r300_sampler_state {
/* Gallium sampler state. */
159 struct pipe_sampler_state state;
161 uint32_t filter0; /* R300_TX_FILTER0: 0x4400 */
162 uint32_t filter1; /* R300_TX_FILTER1: 0x4440 */
164 /* Min/max LOD must be clamped to [0, last_level], thus
165 * it's dependent on a currently bound texture */
166 unsigned min_lod, max_lod;
/* Texture format register values. Embedded in r300_sampler_view,
 * r300_texture_sampler_state and r300_texture. */
169 struct r300_texture_format_state {
170 uint32_t format0; /* R300_TX_FORMAT0: 0x4480 */
171 uint32_t format1; /* R300_TX_FORMAT1: 0x44c0 */
172 uint32_t format2; /* R300_TX_FORMAT2: 0x4500 */
173 uint32_t tile_config; /* R300_TX_OFFSET (subset thereof) */
/* Driver sampler view: the Gallium pipe_sampler_view followed by the
 * driver-side swizzle, format registers and texture cache region. */
176 struct r300_sampler_view {
177 struct pipe_sampler_view base;
179 /* Swizzles in the UTIL_FORMAT_SWIZZLE_* representation,
180 * derived from base. */
181 unsigned char swizzle[4];
183 /* Copy of r300_texture::tx_format with format-specific bits
185 struct r300_texture_format_state format;
187 /* The texture cache region for this texture. */
188 uint32_t texcache_region;
/* Register values used when a texture is bound as a framebuffer attachment
 * (color buffer or zbuffer): one pitch per miplevel and one format. */
191 struct r300_texture_fb_state {
192 uint32_t pitch[R300_MAX_TEXTURE_LEVELS]; /* COLORPITCH or DEPTHPITCH. */
193 uint32_t format; /* US_OUT_FMT or R300_ZB_FORMAT */
/* Register values for one texture unit: texture format registers combined
 * with the filter and border color registers. Stored per unit in
 * r300_textures_state::regs. */
196 struct r300_texture_sampler_state {
197 struct r300_texture_format_state format;
198 uint32_t filter0; /* R300_TX_FILTER0: 0x4400 */
199 uint32_t filter1; /* R300_TX_FILTER1: 0x4440 */
200 uint32_t border_color; /* R300_TX_BORDER_COLOR: 0x45c0 */
/* Texture binding state: up to 16 sampler views and 16 sampler states, plus
 * the merged per-unit register values. */
203 struct r300_textures_state {
/* Sampler views. */
205 struct r300_sampler_view *sampler_views[16];
206 int sampler_view_count;
207 /* Sampler states. */
208 struct r300_sampler_state *sampler_states[16];
209 int sampler_state_count;
211 /* This is the merge of the texture and sampler states. */
/* NOTE(review): 0x4101 is not dword-aligned, unlike every other register
 * offset quoted in this file; the offset is probably 0x4104 -- confirm
 * against the register header. */
213 uint32_t tx_enable; /* R300_TX_ENABLE: 0x4101 */
214 struct r300_texture_sampler_state regs[16];
/* Vertex stream formatting state: values for the eight VAP programmable
 * stream control registers and their eight extension registers. */
217 struct r300_vertex_stream_state {
218 /* R300_VAP_PROG_STREAM_CNTL_[0-7] */
219 uint32_t vap_prog_stream_cntl[8];
220 /* R300_VAP_PROG_STREAM_CNTL_EXT_[0-7] */
221 uint32_t vap_prog_stream_cntl_ext[8];
226 struct r300_invariant_state {
230 struct r300_vap_invariant_state {
/* Viewport state: scale and offset for each axis, stored as floats, plus the
 * VTE control register value. */
234 struct r300_viewport_state {
235 float xscale; /* R300_VAP_VPORT_XSCALE: 0x2098 */
236 float xoffset; /* R300_VAP_VPORT_XOFFSET: 0x209c */
237 float yscale; /* R300_VAP_VPORT_YSCALE: 0x20a0 */
238 float yoffset; /* R300_VAP_VPORT_YOFFSET: 0x20a4 */
239 float zscale; /* R300_VAP_VPORT_ZSCALE: 0x20a8 */
240 float zoffset; /* R300_VAP_VPORT_ZOFFSET: 0x20ac */
241 uint32_t vte_control; /* R300_VAP_VTE_CNTL: 0x20b0 */
/* ZTOP state: holds the value of the single ZB_ZTOP register. */
244 struct r300_ztop_state {
245 uint32_t z_buffer_top; /* R300_ZB_ZTOP: 0x4f14 */
248 /* The next several objects are not pure Radeon state; they inherit from
249 * various Gallium classes. */
/* Shader constant buffer description.
 * NOTE(review): the member that holds the constants themselves is not
 * visible in this excerpt. */
251 struct r300_constant_buffer {
252 /* Buffer of constants */
254 /* Remapping table.
 * NOTE(review): presumably maps shader constant indices to positions in the
 * buffer, and may be unset when no remapping is needed -- confirm. */
255 unsigned *remap_table;
256 /* const buffer base */
257 uint32_t buffer_base;
262 * This is not a subclass of pipe_query because pipe_query is never
263 * actually fully defined. So, rather than have it as a member, and do
264 * subclass-style casting, we treat pipe_query as an opaque, and just
265 * trust that our state tracker does not ever mess up query objects.
268 /* The kind of query. Currently only OQ is supported. */
270 /* The number of pipes where query results are stored. */
272 /* How many results have been written, in dwords. It's incremented
273 * after end_query and flush. */
274 unsigned num_results;
275 /* if we've flushed the query */
277 /* if begin has been emitted */
278 boolean begin_emitted;
280 /* The buffer where query results are stored. */
281 struct r300_winsys_buffer *buffer;
282 struct r300_winsys_cs_buffer *cs_buffer;
283 /* The size of the buffer. */
284 unsigned buffer_size;
285 /* The domain of the buffer. */
286 enum r300_buffer_domain domain;
288 /* Linked list members. */
289 struct r300_query* prev;
290 struct r300_query* next;
295 * This is a fake fence. Instead of syncing with the fence, we sync
296 * with the context, which is inefficient but compliant.
298 * This is not a subclass of pipe_fence_handle because pipe_fence_handle is
299 * never actually fully defined. So, rather than have it as a member, and do
300 * subclass-style casting, we treat pipe_fence_handle as an opaque, and just
301 * trust that our state tracker does not ever mess up fence objects.
304 struct pipe_reference reference;
305 struct r300_context *ctx;
/* Driver surface. Begins with the Gallium pipe_surface; the r300_surface()
 * wrapper in this file casts a pipe_surface pointer straight to this type. */
309 struct r300_surface {
310 struct pipe_surface base;
312 /* Winsys buffer backing the texture. */
313 struct r300_winsys_buffer *buffer;
314 struct r300_winsys_cs_buffer *cs_buffer;
/* Memory domain of the backing buffer. */
316 enum r300_buffer_domain domain;
318 uint32_t offset; /* COLOROFFSET or DEPTHOFFSET. */
319 uint32_t pitch; /* COLORPITCH or DEPTHPITCH. */
320 uint32_t format; /* US_OUT_FMT or ZB_FORMAT. */
322 /* Parameters dedicated to the CBZB clear. */
323 uint32_t cbzb_width; /* Aligned width. */
324 uint32_t cbzb_height; /* Half of the height. */
325 uint32_t cbzb_midpoint_offset; /* DEPTHOFFSET. */
326 uint32_t cbzb_pitch; /* DEPTHPITCH. */
327 uint32_t cbzb_format; /* ZB_FORMAT. */
329 /* Whether the CBZB clear is allowed on the surface. */
330 boolean cbzb_allowed;
/* Layout description of a texture: dimensions, tiling, and per-miplevel
 * offsets, strides and sizes, plus the CBZB and zbuffer compression flags.
 * Arrays sized R300_MAX_TEXTURE_LEVELS are indexed by miplevel. */
334 struct r300_texture_desc {
338 /* Width, height, and depth.
339 * Most of the time, these are equal to pipe_texture::width0, height0,
340 * and depth0. However, NPOT 3D textures must have dimensions aligned
341 * to POT, and this is the only case when these variables differ from
343 unsigned width0, height0, depth0;
346 * Macrotiling is specified per-level because small mipmaps cannot
348 enum r300_buffer_tiling microtile;
349 enum r300_buffer_tiling macrotile[R300_MAX_TEXTURE_LEVELS];
351 /* Offsets into the buffer. */
352 unsigned offset_in_bytes[R300_MAX_TEXTURE_LEVELS];
354 /* Strides for each mip-level. */
355 unsigned stride_in_pixels[R300_MAX_TEXTURE_LEVELS];
356 unsigned stride_in_bytes[R300_MAX_TEXTURE_LEVELS];
358 /* Size of one zslice or face or 2D image based on the texture target. */
359 unsigned layer_size_in_bytes[R300_MAX_TEXTURE_LEVELS];
361 /* Total size of this texture, in bytes,
362 * derived from the texture properties. */
363 unsigned size_in_bytes;
365 /* Total size of the buffer backing this texture, in bytes.
366 * It must be >= size_in_bytes. */
367 unsigned buffer_size_in_bytes;
370 * If non-zero, override the natural texture layout with
371 * a custom stride (in bytes).
373 * \note Mipmapping fails for textures with a non-natural layout!
375 * \sa r300_texture_get_stride
377 unsigned stride_in_bytes_override;
379 /* Whether this texture has non-power-of-two dimensions.
380 * It can be either a regular texture or a rectangle one. */
383 /* This flag says that hardware must use the stride for addressing
384 * instead of the width. */
385 boolean uses_stride_addressing;
387 /* Whether CBZB fast color clear is allowed on the miplevel. */
388 boolean cbzb_allowed[R300_MAX_TEXTURE_LEVELS];
390 /* Zbuffer compression info for each miplevel. */
391 boolean zcomp8x8[R300_MAX_TEXTURE_LEVELS];
392 /* If zero, then disable compression. */
393 unsigned zmask_dwords[R300_MAX_TEXTURE_LEVELS];
/* Driver texture object: the layout description, the backing winsys buffer,
 * the register values derived for it, and HyperZ bookkeeping. */
396 struct r300_texture {
/* Layout description; see struct r300_texture_desc. */
397 struct r300_texture_desc desc;
/* Memory domain of the backing buffer. */
399 enum r300_buffer_domain domain;
401 /* Winsys buffer backing this texture. */
402 struct r300_winsys_buffer *buffer;
403 struct r300_winsys_cs_buffer *cs_buffer;
405 /* Registers carrying texture format data. */
406 /* Only format-independent bits should be filled in. */
407 struct r300_texture_format_state tx_format;
408 /* All bits should be filled in. */
409 struct r300_texture_fb_state fb_state;
411 /* HyperZ memory allocations, one entry per miplevel. */
412 struct mem_block *hiz_mem[R300_MAX_TEXTURE_LEVELS];
413 boolean hiz_in_use[R300_MAX_TEXTURE_LEVELS];
415 /* This is the level the tiling flags were last set for.
416 * It is used to prevent redundant tiling-flags changes from happening. */
417 unsigned surface_level;
/* Vertex element state: the Gallium vertex elements together with the data
 * kept for them (per-attribute format sizes, the u_vbuf_mgr element object,
 * total vertex size, and the vertex stream register values). */
420 struct r300_vertex_element_state {
/* Per-attribute arrays; both are sized PIPE_MAX_ATTRIBS.
 * NOTE(review): the unit of format_size is not stated here -- confirm. */
422 struct pipe_vertex_element velem[PIPE_MAX_ATTRIBS];
423 unsigned format_size[PIPE_MAX_ATTRIBS];
425 struct u_vbuf_mgr_elements *vmgr_elements;
427 /* The size of the vertex, in dwords. */
428 unsigned vertex_size_dwords;
430 struct r300_vertex_stream_state vertex_stream;
/* The driver context: the Gallium pipe_context followed by all driver-side
 * state, including the list of state atoms and the dirty-atom range. */
433 struct r300_context {
/* NOTE(review): the r300_context() wrapper in this file casts a
 * pipe_context pointer straight to this type, which only works while this
 * is the first member -- confirm nothing precedes it. */
435 struct pipe_context context;
437 /* The interface to the windowing system, etc. */
438 struct r300_winsys_screen *rws;
439 /* The command stream. */
440 struct r300_winsys_cs *cs;
/* The screen; CTX_DBG_ON reads the debug flags through it. */
442 struct r300_screen *screen;
444 /* Draw module. Used mostly for SW TCL. */
445 struct draw_context* draw;
446 /* Vertex buffer for SW TCL. */
447 struct pipe_resource* vbo;
448 /* Offset and size into the SW TCL VBO. */
449 size_t draw_vbo_offset;
450 size_t draw_vbo_size;
451 /* Whether the VBO must not be flushed. */
452 boolean draw_vbo_locked;
453 boolean draw_first_emitted;
455 /* Accelerated blit support. */
456 struct blitter_context* blitter;
457 /* Stencil two-sided reference value fallback. */
458 struct r300_stencilref_context *stencilref_fallback;
460 /* The KIL opcode needs the first texture unit to be enabled
461 * on r3xx-r4xx. In order to calm down the CS checker, we bind this
462 * dummy texture there. */
463 struct r300_sampler_view *texkill_sampler;
465 /* When no vertex buffer is set, this one is used instead to prevent
467 struct pipe_resource *dummy_vb;
469 /* The currently active query. */
470 struct r300_query *query_current;
471 /* The saved query for blitter operations. */
472 struct r300_query *blitter_saved_query;
/* NOTE(review): presumably the head of the linked list formed by
 * r300_query::prev and r300_query::next -- confirm. */
474 struct r300_query query_list;
476 /* Various CSO state objects. */
478 /* Each atom is emitted in the order it appears here, which can affect
479 * performance and stability if not handled with care. */
/* foreach_atom walks a struct r300_atom pointer from gpu_flush up to and
 * including query_start, so every member between those two must be a
 * struct r300_atom. gpu_flush is the first atom. */
481 struct r300_atom gpu_flush;
482 /* Anti-aliasing (MSAA) state. */
483 struct r300_atom aa_state;
484 /* Framebuffer state. */
485 struct r300_atom fb_state;
486 /* HyperZ state (various SC/ZB bits). */
487 struct r300_atom hyperz_state;
489 struct r300_atom ztop_state;
490 /* Depth, stencil, and alpha state. */
491 struct r300_atom dsa_state;
493 struct r300_atom blend_state;
494 /* Blend color state. */
495 struct r300_atom blend_color_state;
497 struct r300_atom scissor_state;
498 /* Invariant state. This must be emitted to get the engine started. */
499 struct r300_atom invariant_state;
500 /* Viewport state. */
501 struct r300_atom viewport_state;
503 struct r300_atom pvs_flush;
504 /* VAP invariant state. */
505 struct r300_atom vap_invariant_state;
506 /* Vertex stream formatting state. */
507 struct r300_atom vertex_stream_state;
509 struct r300_atom vs_state;
510 /* User clip planes. */
511 struct r300_atom clip_state;
512 /* RS block state + VAP (vertex shader) output mapping state. */
513 struct r300_atom rs_block_state;
514 /* Rasterizer state. */
515 struct r300_atom rs_state;
516 /* Framebuffer state (pipelined regs). */
517 struct r300_atom fb_state_pipelined;
518 /* Fragment shader. */
520 /* Fragment shader RC_CONSTANT_STATE variables. */
521 struct r300_atom fs_rc_constant_state;
522 /* Fragment shader constant buffer. */
523 struct r300_atom fs_constants;
524 /* Vertex shader constant buffer. */
525 struct r300_atom vs_constants;
526 /* Texture cache invalidate. */
527 struct r300_atom texture_cache_inval;
528 /* Textures state. */
529 struct r300_atom textures_state;
531 struct r300_atom hiz_clear;
533 struct r300_atom zmask_clear;
534 /* Occlusion query. This is the last atom visited by foreach_atom. */
535 struct r300_atom query_start;
537 /* The dirty range: first_dirty points to the first dirty atom and
 * last_dirty points one past the last dirty atom (r300_mark_atom_dirty
 * stores atom+1, and foreach_dirty_atom stops when it reaches last_dirty). */
538 struct r300_atom *first_dirty, *last_dirty;
540 /* Vertex elements for Gallium. */
541 struct r300_vertex_element_state *velems;
543 struct pipe_index_buffer index_buffer;
545 /* Vertex info for Draw. */
546 struct vertex_info vertex_info;
548 struct pipe_stencil_ref stencil_ref;
549 struct pipe_viewport_state viewport;
551 /* Stream locations for SWTCL. */
552 int stream_loc_notcl[16];
554 /* Flag indicating whether or not the HW is dirty. */
556 /* Whether polygon offset is enabled. */
557 boolean polygon_offset_enabled;
558 /* Z buffer bit depth. */
559 uint32_t zbuffer_bpp;
560 /* Whether rendering is conditional and should be skipped. */
561 boolean skip_rendering;
562 /* Point sprites texcoord index, 1 bit per texcoord */
563 int sprite_coord_enable;
564 /* Whether two-sided color selection is enabled (AKA light_twoside). */
565 boolean two_sided_color;
568 /* Whether ZMASK is enabled. */
569 boolean zmask_in_use;
570 /* Whether ZMASK is being decompressed. */
571 boolean zmask_decompress;
572 /* Whether ZMASK is locked, i.e. should be disabled and cannot be taken over. */
573 boolean zmask_locked;
574 /* The zbuffer the ZMASK of which is locked. */
575 struct pipe_surface *locked_zbuffer;
577 void *dsa_decompress_zmask;
579 /* two mem block managers for hiz/zmask ram space */
580 struct mem_block *hiz_mm;
583 struct u_upload_mgr *upload_ib;
585 struct u_vbuf_mgr *vbuf_mgr;
587 struct util_slab_mempool pool_transfers;
590 uint64_t flush_counter;
592 /* const tracking for VS */
595 /* AOS (PACKET3_3D_LOAD_VBPNTR) command buffer for the case offset=0. */
596 uint32_t vertex_arrays_cb[(16 * 3 + 1) / 2];
597 boolean vertex_arrays_dirty;
599 /* Whether any buffer (FB, textures, VBOs) has been set, but buffers
600 * haven't been validated yet. */
601 boolean validate_buffers;
602 /* Whether user buffers have been validated. */
603 boolean upload_vb_validated;
604 boolean upload_ib_validated;
/**
 * Iterate over every state atom of a context.
 *
 * Walks a struct r300_atom pointer from r300->gpu_flush up to and including
 * r300->query_start, so it relies on every member between those two being a
 * contiguously laid out struct r300_atom.
 *
 * \param r300  pointer to the context; any pointer expression is accepted.
 * \param atom  struct r300_atom pointer lvalue used as the loop cursor.
 *
 * Both parameters are parenthesized in the expansion so that expression
 * arguments (for example &ctx) expand correctly. Each parameter is evaluated
 * more than once, so do not pass expressions with side effects.
 */
#define foreach_atom(r300, atom) \
    for ((atom) = &(r300)->gpu_flush; \
         (atom) != (&(r300)->query_start) + 1; \
         (atom)++)
/**
 * Iterate over the dirty range of a context.
 *
 * Visits every atom in the half-open range starting at r300->first_dirty and
 * ending just before r300->last_dirty. The body does not run when the two
 * pointers are equal. Atoms inside the range are visited whether or not they
 * are individually dirty.
 *
 * \param r300  pointer to the context; any pointer expression is accepted.
 * \param atom  struct r300_atom pointer lvalue used as the loop cursor.
 *
 * Both parameters are parenthesized in the expansion so that expression
 * arguments (for example &ctx) expand correctly. Each parameter is evaluated
 * more than once, so do not pass expressions with side effects.
 */
#define foreach_dirty_atom(r300, atom) \
    for ((atom) = (r300)->first_dirty; \
         (atom) != (r300)->last_dirty; \
         (atom)++)
613 /* Convenience cast wrappers. */
/* Reinterpret an opaque pipe_query pointer as the driver query type.
 * This is a plain pointer cast; no checking is performed. */
614 static INLINE struct r300_query* r300_query(struct pipe_query* q)
616 return (struct r300_query*)q;
/* Reinterpret a pipe_surface pointer as the driver surface type.
 * This is a plain pointer cast; no checking is performed. */
619 static INLINE struct r300_surface* r300_surface(struct pipe_surface* surf)
621 return (struct r300_surface*)surf;
/* Reinterpret a pipe_resource pointer as the driver texture type.
 * This is a plain pointer cast; no checking is performed, so the caller
 * must know that the resource really is an r300_texture. */
624 static INLINE struct r300_texture* r300_texture(struct pipe_resource* tex)
626 return (struct r300_texture*)tex;
/* Reinterpret a pipe_context pointer as the driver context type.
 * This is a plain pointer cast; no checking is performed. */
629 static INLINE struct r300_context* r300_context(struct pipe_context* context)
631 return (struct r300_context*)context;
/* Return the fragment shader held by the context: the state pointer of the
 * fs atom, cast to struct r300_fragment_shader. */
634 static INLINE struct r300_fragment_shader *r300_fs(struct r300_context *r300)
636 return (struct r300_fragment_shader*)r300->fs.state;
/* Extend the dirty range of the context so that it covers the given atom.
 * The range runs from first_dirty up to, but not including, last_dirty.
 * NOTE(review): some lines of this function body are not visible in this
 * excerpt, so the description covers only the range update shown below. */
639 static INLINE void r300_mark_atom_dirty(struct r300_context *r300,
640 struct r300_atom *atom)
/* No dirty range yet: start one that holds just this atom. */
644 if (!r300->first_dirty) {
645 r300->first_dirty = atom;
646 r300->last_dirty = atom+1;
/* A range exists: move whichever bound is needed outward to include atom. */
648 if (atom < r300->first_dirty)
649 r300->first_dirty = atom;
650 else if (atom+1 > r300->last_dirty)
651 r300->last_dirty = atom+1;
/* Declarations of functions whose definitions are not in this header. */
655 struct pipe_context* r300_create_context(struct pipe_screen* screen,
658 void r300_finish(struct r300_context *r300);
/* Takes an untyped data pointer.
 * NOTE(review): presumably a flush callback receiving the context --
 * confirm at the definition. */
659 void r300_flush_cb(void *data);
661 /* Context initialization. */
662 struct draw_stage* r300_draw_stage(struct r300_context* r300);
663 void r300_init_blit_functions(struct r300_context *r300);
664 void r300_init_flush_functions(struct r300_context* r300);
665 void r300_init_query_functions(struct r300_context* r300);
666 void r300_init_render_functions(struct r300_context *r300);
667 void r300_init_state_functions(struct r300_context* r300);
668 void r300_init_resource_functions(struct r300_context* r300);
671 void r300_decompress_zmask(struct r300_context *r300);
672 void r300_decompress_zmask_locked_unsafe(struct r300_context *r300);
673 void r300_decompress_zmask_locked(struct r300_context *r300);
676 void r300_resume_query(struct r300_context *r300,
677 struct r300_query *query);
678 void r300_stop_query(struct r300_context *r300);
680 /* r300_render_translate.c */
/* index_buffer, index_size and start are passed by pointer.
 * NOTE(review): presumably they are updated to describe the translated
 * index buffer -- confirm at the definition. */
681 void r300_translate_index_buffer(struct r300_context *r300,
682 struct pipe_resource **index_buffer,
683 unsigned *index_size, unsigned index_offset,
684 unsigned *start, unsigned count);
686 /* r300_render_stencilref.c */
687 void r300_plug_in_stencil_ref_fallback(struct r300_context *r300);
690 void r300_draw_flush_vbuf(struct r300_context *r300);
691 void r500_emit_index_bias(struct r300_context *r300, int index_bias);
/* Reason codes passed to r300_mark_fb_state_dirty to say what changed.
 * NOTE(review): the meaning of each value is inferred from its name only;
 * see the definition of r300_mark_fb_state_dirty for the actual handling. */
694 enum r300_fb_state_change {
695 R300_CHANGED_FB_STATE = 0,
696 R300_CHANGED_HYPERZ_FLAG,
697 R300_CHANGED_MULTIWRITE
/* Marks framebuffer state dirty; change names what was modified
 * (see enum r300_fb_state_change). */
700 void r300_mark_fb_state_dirty(struct r300_context *r300,
701 enum r300_fb_state_change change);
702 void r300_mark_fs_code_dirty(struct r300_context *r300);
704 /* r300_state_derived.c */
705 void r300_update_derived_state(struct r300_context* r300);
708 void r500_dump_rs_block(struct r300_rs_block *rs);
/* Report whether the given debug flags are enabled for this context.
 * Forwards to SCREEN_DBG_ON using the screen the context belongs to. */
711 static INLINE boolean CTX_DBG_ON(struct r300_context * ctx, unsigned flags)
713 return SCREEN_DBG_ON(ctx->screen, flags);
/* printf-style debug output: writes the formatted message to stderr, and
 * only when CTX_DBG_ON(ctx, flags) is true.
 * NOTE(review): the va_list setup and teardown lines are not visible in this
 * excerpt. */
716 static INLINE void CTX_DBG(struct r300_context * ctx, unsigned flags,
717 const char * fmt, ...)
719 if (CTX_DBG_ON(ctx, flags)) {
722 vfprintf(stderr, fmt, va);
/* Short alias for CTX_DBG_ON. */
727 #define DBG_ON CTX_DBG_ON
730 #endif /* R300_CONTEXT_H */