;;
xnouveau)
PKG_CHECK_MODULES([NOUVEAU], [libdrm_nouveau >= $LIBDRM_NOUVEAU_REQUIRED])
- GALLIUM_DRIVERS_DIRS="$GALLIUM_DRIVERS_DIRS nouveau nvfx nv50 nvc0"
+ GALLIUM_DRIVERS_DIRS="$GALLIUM_DRIVERS_DIRS nouveau nv50 nvc0"
gallium_check_st "nouveau/drm" "dri-nouveau" "xorg-nouveau" "" "xvmc-nouveau" "vdpau-nouveau"
;;
xswrast)
#include "nouveau_context.h"
#include "nouveau_video.h"
-#include "nvfx/nvfx_context.h"
-#include "nvfx/nvfx_resource.h"
#include "nouveau/nouveau_bo.h"
#include "nouveau/nouveau_buffer.h"
#include "util/u_video.h"
#include "nouveau/nouveau_device.h"
#include "nouveau_winsys.h"
-static bool
-nouveau_video_is_nvfx(struct nouveau_decoder *dec) {
- if (dec->screen->device->chipset < 0x50)
- return true;
- if (dec->screen->device->chipset >= 0x60 && dec->screen->device->chipset < 0x70)
- return true;
- return false;
-}
-
static int
nouveau_vpe_init(struct nouveau_decoder *dec) {
int ret;
{
struct nouveau_video_buffer *buf = (struct nouveau_video_buffer *)buffer;
struct nouveau_channel *chan = dec->screen->channel;
- struct nouveau_bo *bo_y, *bo_c;
+ struct nouveau_bo *bo_y = ((struct nv04_resource *)buf->resources[0])->bo;
+ struct nouveau_bo *bo_c = ((struct nv04_resource *)buf->resources[1])->bo;
unsigned i;
if (!buf)
dec->surfaces[i] = buf;
dec->num_surfaces++;
- if (nouveau_video_is_nvfx(dec)) {
- bo_y = ((struct nvfx_resource *)buf->resources[0])->bo;
- bo_c = ((struct nvfx_resource *)buf->resources[1])->bo;
- } else {
- bo_y = ((struct nv04_resource *)buf->resources[0])->bo;
- bo_c = ((struct nv04_resource *)buf->resources[1])->bo;
- }
MARK_RING(chan, 3, 2);
BEGIN_RING(chan, dec->mpeg, NV31_MPEG_IMAGE_Y_OFFSET(i), 2);
OUT_RELOCl(chan, bo_y, 0, NOUVEAU_BO_RDWR);
}
static struct pipe_video_decoder *
-nvfx_context_create_decoder(struct pipe_context *context,
- enum pipe_video_profile profile,
- enum pipe_video_entrypoint entrypoint,
- enum pipe_video_chroma_format chroma_format,
- unsigned width, unsigned height,
- unsigned max_references, bool expect_chunked_decode)
-{
- struct nouveau_screen *screen = &nvfx_context(context)->screen->base;
- return nouveau_create_decoder(context, screen, profile, entrypoint,
- chroma_format, width, height,
- max_references, expect_chunked_decode);
-}
-
-static struct pipe_video_buffer *
-nvfx_context_video_buffer_create(struct pipe_context *pipe,
- const struct pipe_video_buffer *templat)
-{
- struct nouveau_screen *screen = &nvfx_context(pipe)->screen->base;
- return nouveau_video_buffer_create(pipe, screen, templat);
-}
-
-void
-nvfx_context_init_vdec(struct nvfx_context *nv)
-{
- nv->pipe.create_video_decoder = nvfx_context_create_decoder;
- nv->pipe.create_video_buffer = nvfx_context_video_buffer_create;
-}
-
-static struct pipe_video_decoder *
nouveau_context_create_decoder(struct pipe_context *context,
enum pipe_video_profile profile,
enum pipe_video_entrypoint entrypoint,
}
extern struct pipe_screen *
-nvfx_screen_create(struct nouveau_device *);
-
-extern struct pipe_screen *
nv50_screen_create(struct nouveau_device *);
extern struct pipe_screen *
+++ /dev/null
-# Mesa 3-D graphics library
-#
-# Copyright (C) 2011 Chia-I Wu <olvaffe@gmail.com>
-# Copyright (C) 2011 LunarG Inc.
-#
-# Permission is hereby granted, free of charge, to any person obtaining a
-# copy of this software and associated documentation files (the "Software"),
-# to deal in the Software without restriction, including without limitation
-# the rights to use, copy, modify, merge, publish, distribute, sublicense,
-# and/or sell copies of the Software, and to permit persons to whom the
-# Software is furnished to do so, subject to the following conditions:
-#
-# The above copyright notice and this permission notice shall be included
-# in all copies or substantial portions of the Software.
-#
-# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
-# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
-# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
-# THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
-# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
-# FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
-# DEALINGS IN THE SOFTWARE.
-
-LOCAL_PATH := $(call my-dir)
-
-# get C_SOURCES
-include $(LOCAL_PATH)/Makefile.sources
-
-include $(CLEAR_VARS)
-
-LOCAL_SRC_FILES := $(C_SOURCES)
-LOCAL_C_INCLUDES := $(DRM_TOP)
-
-LOCAL_MODULE := libmesa_pipe_nvfx
-
-include $(GALLIUM_COMMON_MK)
-include $(BUILD_STATIC_LIBRARY)
+++ /dev/null
-TOP = ../../../..
-include $(TOP)/configs/current
-
-LIBNAME = nvfx
-
-# get C_SOURCES
-include Makefile.sources
-
-LIBRARY_INCLUDES = \
- $(LIBDRM_CFLAGS) \
- -I$(TOP)/src/gallium/drivers/nouveau/include
-
-include ../../Makefile.template
-
-# FIXME: Remove when this driver is converted to automake.
-all: default
+++ /dev/null
-C_SOURCES := \
- nv04_2d.c \
- nvfx_buffer.c \
- nvfx_context.c \
- nvfx_clear.c \
- nvfx_draw.c \
- nvfx_fragprog.c \
- nvfx_fragtex.c \
- nv30_fragtex.c \
- nv40_fragtex.c \
- nvfx_miptree.c \
- nvfx_push.c \
- nvfx_query.c \
- nvfx_resource.c \
- nvfx_screen.c \
- nvfx_state.c \
- nvfx_state_emit.c \
- nvfx_state_fb.c \
- nvfx_surface.c \
- nvfx_transfer.c \
- nvfx_vbo.c \
- nvfx_vertprog.c
+++ /dev/null
-Import('*')
-
-env = env.Clone()
-
-env.PrependUnique(delete_existing=1, CPPPATH = [
- '#/src/gallium/drivers',
-])
-
-nvfx = env.ConvenienceLibrary(
- target = 'nvfx',
- source = env.ParseSourceList('Makefile.sources', 'C_SOURCES')
- )
-
-Export('nvfx')
+++ /dev/null
-#ifndef NV01_2D_XML
-#define NV01_2D_XML
-
-/* Autogenerated file, DO NOT EDIT manually!
-
-This file was generated by the rules-ng-ng headergen tool in this git repository:
-http://0x04.net/cgit/index.cgi/rules-ng-ng
-git clone git://0x04.net/rules-ng-ng
-
-The rules-ng-ng source files this header was generated from are:
-- nv01_2d.xml ( 33462 bytes, from 2010-08-05 19:38:53)
-- copyright.xml ( 6503 bytes, from 2010-04-10 23:15:50)
-- nv_defs.xml ( 4437 bytes, from 2010-08-05 19:38:53)
-- nv_object.xml ( 10424 bytes, from 2010-08-05 19:38:53)
-- nvchipsets.xml ( 2824 bytes, from 2010-08-05 19:38:53)
-
-Copyright (C) 2006-2010 by the following authors:
-- Artur Huillet <arthur.huillet@free.fr> (ahuillet)
-- Ben Skeggs (darktama, darktama_)
-- B. R. <koala_br@users.sourceforge.net> (koala_br)
-- Carlos Martin <carlosmn@users.sf.net> (carlosmn)
-- Christoph Bumiller <e0425955@student.tuwien.ac.at> (calim, chrisbmr)
-- Dawid Gajownik <gajownik@users.sf.net> (gajownik)
-- Dmitry Baryshkov
-- Dmitry Eremin-Solenikov <lumag@users.sf.net> (lumag)
-- EdB <edb_@users.sf.net> (edb_)
-- Erik Waling <erikwailing@users.sf.net> (erikwaling)
-- Francisco Jerez <currojerez@riseup.net> (curro, curro_, currojerez)
-- imirkin <imirkin@users.sf.net> (imirkin)
-- jb17bsome <jb17bsome@bellsouth.net> (jb17bsome)
-- Jeremy Kolb <kjeremy@users.sf.net> (kjeremy)
-- Laurent Carlier <lordheavym@gmail.com> (lordheavy)
-- Luca Barbieri <luca@luca-barbieri.com> (lb, lb1)
-- Maarten Maathuis <madman2003@gmail.com> (stillunknown)
-- Marcin Kościelnicki <koriakin@0x04.net> (mwk, koriakin)
-- Mark Carey <mark.carey@gmail.com> (careym)
-- Matthieu Castet <matthieu.castet@parrot.com> (mat-c)
-- nvidiaman <nvidiaman@users.sf.net> (nvidiaman)
-- Patrice Mandin <mandin.patrice@orange.fr> (pmandin, pmdata)
-- Pekka Paalanen <pq@iki.fi> (pq, ppaalanen)
-- Peter Popov <ironpeter@users.sf.net> (ironpeter)
-- Richard Hughes <hughsient@users.sf.net> (hughsient)
-- Rudi Cilibrasi <cilibrar@users.sf.net> (cilibrar)
-- Serge Martin
-- Simon Raffeiner
-- Stephane Loeuillet <leroutier@users.sf.net> (leroutier)
-- Stephane Marchesin <stephane.marchesin@gmail.com> (marcheu)
-- sturmflut <sturmflut@users.sf.net> (sturmflut)
-- Sylvain Munaut <tnt@246tNt.com>
-- Victor Stinner <victor.stinner@haypocalc.com> (haypo)
-- Wladmir van der Laan <laanwj@gmail.com> (miathan6)
-- Younes Manton <younes.m@gmail.com> (ymanton)
-
-Permission is hereby granted, free of charge, to any person obtaining
-a copy of this software and associated documentation files (the
-"Software"), to deal in the Software without restriction, including
-without limitation the rights to use, copy, modify, merge, publish,
-distribute, sublicense, and/or sell copies of the Software, and to
-permit persons to whom the Software is furnished to do so, subject to
-the following conditions:
-
-The above copyright notice and this permission notice (including the
-next paragraph) shall be included in all copies or substantial
-portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
-EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
-MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
-IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
-LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
-OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
-WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
-*/
-
-
-
-#define NV01_CONTEXT_BETA1_DMA_NOTIFY 0x00000180
-
-#define NV01_CONTEXT_BETA1_BETA_1D31 0x00000300
-
-
-#define NV04_BETA_SOLID_DMA_NOTIFY 0x00000180
-
-#define NV04_BETA_SOLID_BETA_FACTOR 0x00000300
-
-
-#define NV01_CONTEXT_COLOR_KEY_DMA_NOTIFY 0x00000180
-
-#define NV01_CONTEXT_COLOR_KEY_COLOR_FORMAT 0x00000300
-#define NV01_CONTEXT_COLOR_KEY_COLOR_FORMAT_A16R5G6B5 0x00000001
-#define NV01_CONTEXT_COLOR_KEY_COLOR_FORMAT_X16A1R5G5B5 0x00000002
-#define NV01_CONTEXT_COLOR_KEY_COLOR_FORMAT_A8R8G8B8 0x00000003
-
-#define NV01_CONTEXT_COLOR_KEY_COLOR 0x00000304
-
-
-#define NV01_CONTEXT_PATTERN_DMA_NOTIFY 0x00000180
-
-#define NV01_CONTEXT_PATTERN_COLOR_FORMAT 0x00000300
-
-#define NV01_CONTEXT_PATTERN_MONOCHROME_FORMAT 0x00000304
-
-#define NV01_CONTEXT_PATTERN_SHAPE 0x00000308
-
-#define NV01_CONTEXT_PATTERN_COLOR(i0) (0x00000310 + 0x4*(i0))
-#define NV01_CONTEXT_PATTERN_COLOR__ESIZE 0x00000004
-#define NV01_CONTEXT_PATTERN_COLOR__LEN 0x00000002
-
-#define NV01_CONTEXT_PATTERN_PATTERN(i0) (0x00000318 + 0x4*(i0))
-#define NV01_CONTEXT_PATTERN_PATTERN__ESIZE 0x00000004
-#define NV01_CONTEXT_PATTERN_PATTERN__LEN 0x00000002
-
-
-#define NV01_CONTEXT_CLIP_RECTANGLE_DMA_NOTIFY 0x00000180
-
-#define NV01_CONTEXT_CLIP_RECTANGLE_POINT 0x00000300
-#define NV01_CONTEXT_CLIP_RECTANGLE_POINT_X__MASK 0x0000ffff
-#define NV01_CONTEXT_CLIP_RECTANGLE_POINT_X__SHIFT 0
-#define NV01_CONTEXT_CLIP_RECTANGLE_POINT_Y__MASK 0xffff0000
-#define NV01_CONTEXT_CLIP_RECTANGLE_POINT_Y__SHIFT 16
-
-#define NV01_CONTEXT_CLIP_RECTANGLE_SIZE 0x00000304
-#define NV01_CONTEXT_CLIP_RECTANGLE_SIZE_W__MASK 0x0000ffff
-#define NV01_CONTEXT_CLIP_RECTANGLE_SIZE_W__SHIFT 0
-#define NV01_CONTEXT_CLIP_RECTANGLE_SIZE_H__MASK 0xffff0000
-#define NV01_CONTEXT_CLIP_RECTANGLE_SIZE_H__SHIFT 16
-
-
-#define NV04_CONTEXT_SURFACES_2D_DMA_NOTIFY 0x00000180
-
-#define NV04_CONTEXT_SURFACES_2D_DMA_IMAGE_SOURCE 0x00000184
-
-#define NV04_CONTEXT_SURFACES_2D_DMA_IMAGE_DESTIN 0x00000188
-
-
-#define NV50_CONTEXT_SURFACES_2D_SRC_LINEAR 0x00000200
-
-#define NV50_CONTEXT_SURFACES_2D_SRC_TILE_MODE 0x00000204
-
-#define NV50_CONTEXT_SURFACES_2D_SRC_WIDTH 0x00000208
-
-#define NV50_CONTEXT_SURFACES_2D_SRC_HEIGHT 0x0000020c
-
-#define NV50_CONTEXT_SURFACES_2D_UNK0210 0x00000210
-
-#define NV50_CONTEXT_SURFACES_2D_UNK0214 0x00000214
-
-#define NV50_CONTEXT_SURFACES_2D_DST_LINEAR 0x00000218
-
-#define NV50_CONTEXT_SURFACES_2D_DST_TILE_MODE 0x0000021c
-
-#define NV50_CONTEXT_SURFACES_2D_DST_WIDTH 0x00000220
-
-#define NV50_CONTEXT_SURFACES_2D_DST_HEIGHT 0x00000224
-
-#define NV50_CONTEXT_SURFACES_2D_UNK0228 0x00000228
-
-#define NV50_CONTEXT_SURFACES_2D_UNK022C 0x0000022c
-
-#define NV50_CONTEXT_SURFACES_2D_OFFSET_SOURCE_HIGH 0x00000230
-
-#define NV50_CONTEXT_SURFACES_2D_OFFSET_DESTIN_HIGH 0x00000234
-
-#define NV04_CONTEXT_SURFACES_2D_FORMAT 0x00000300
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_Y8 0x00000001
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_X1R5G5B5_Z1R5G5B5 0x00000002
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_X1R5G5B5_X1R5G5B5 0x00000003
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_R5G6B5 0x00000004
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_Y16 0x00000005
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_X8R8G8B8_Z8R8G8B8 0x00000006
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_X8R8G8B8_X8R8G8B8 0x00000007
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_X1A7R8G8B8_Z1A7R8G8B8 0x00000008
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_X1A7R8G8B8_X1A7R8G8B8 0x00000009
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_A8R8G8B8 0x0000000a
-#define NV04_CONTEXT_SURFACES_2D_FORMAT_Y32 0x0000000b
-
-#define NV04_CONTEXT_SURFACES_2D_PITCH 0x00000304
-#define NV04_CONTEXT_SURFACES_2D_PITCH_SOURCE__MASK 0x0000ffff
-#define NV04_CONTEXT_SURFACES_2D_PITCH_SOURCE__SHIFT 0
-#define NV04_CONTEXT_SURFACES_2D_PITCH_DESTIN__MASK 0xffff0000
-#define NV04_CONTEXT_SURFACES_2D_PITCH_DESTIN__SHIFT 16
-
-#define NV04_CONTEXT_SURFACES_2D_OFFSET_SOURCE 0x00000308
-
-#define NV04_CONTEXT_SURFACES_2D_OFFSET_DESTIN 0x0000030c
-
-
-#define NV04_SWIZZLED_SURFACE_DMA_NOTIFY 0x00000180
-
-#define NV04_SWIZZLED_SURFACE_DMA_IMAGE 0x00000184
-
-#define NV04_SWIZZLED_SURFACE_FORMAT 0x00000300
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR__MASK 0x000000ff
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR__SHIFT 0
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_Y8 0x00000001
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_X1R5G5B5_Z1R5G5B5 0x00000002
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_X1R5G5B5_X1R5G5B5 0x00000003
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_R5G6B5 0x00000004
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_Y16 0x00000005
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_X8R8G8B8_Z8R8G8B8 0x00000006
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_X8R8G8B8_X8R8G8B8 0x00000007
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_X1A7R8G8B8_Z1A7R8G8B8 0x00000008
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_X1A7R8G8B8_X1A7R8G8B8 0x00000009
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_A8R8G8B8 0x0000000a
-#define NV04_SWIZZLED_SURFACE_FORMAT_COLOR_Y32 0x0000000b
-#define NV04_SWIZZLED_SURFACE_FORMAT_BASE_SIZE_U__MASK 0x00ff0000
-#define NV04_SWIZZLED_SURFACE_FORMAT_BASE_SIZE_U__SHIFT 16
-#define NV04_SWIZZLED_SURFACE_FORMAT_BASE_SIZE_V__MASK 0xff000000
-#define NV04_SWIZZLED_SURFACE_FORMAT_BASE_SIZE_V__SHIFT 24
-
-#define NV04_SWIZZLED_SURFACE_OFFSET 0x00000304
-
-
-#define NV03_CONTEXT_ROP_DMA_NOTIFY 0x00000180
-
-#define NV03_CONTEXT_ROP_ROP 0x00000300
-
-
-#define NV04_IMAGE_PATTERN_DMA_NOTIFY 0x00000180
-
-#define NV04_IMAGE_PATTERN_COLOR_FORMAT 0x00000300
-#define NV04_IMAGE_PATTERN_COLOR_FORMAT_A16R5G6B5 0x00000001
-#define NV04_IMAGE_PATTERN_COLOR_FORMAT_X16A1R5G5B5 0x00000002
-#define NV04_IMAGE_PATTERN_COLOR_FORMAT_A8R8G8B8 0x00000003
-
-#define NV04_IMAGE_PATTERN_MONOCHROME_FORMAT 0x00000304
-#define NV04_IMAGE_PATTERN_MONOCHROME_FORMAT_CGA6 0x00000001
-#define NV04_IMAGE_PATTERN_MONOCHROME_FORMAT_LE 0x00000002
-
-#define NV04_IMAGE_PATTERN_MONOCHROME_SHAPE 0x00000308
-#define NV04_IMAGE_PATTERN_MONOCHROME_SHAPE_8X8 0x00000000
-#define NV04_IMAGE_PATTERN_MONOCHROME_SHAPE_64X1 0x00000001
-#define NV04_IMAGE_PATTERN_MONOCHROME_SHAPE_1X64 0x00000002
-
-#define NV04_IMAGE_PATTERN_PATTERN_SELECT 0x0000030c
-#define NV04_IMAGE_PATTERN_PATTERN_SELECT_MONO 0x00000001
-#define NV04_IMAGE_PATTERN_PATTERN_SELECT_COLOR 0x00000002
-
-#define NV04_IMAGE_PATTERN_MONOCHROME_COLOR0 0x00000310
-
-#define NV04_IMAGE_PATTERN_MONOCHROME_COLOR1 0x00000314
-
-#define NV04_IMAGE_PATTERN_MONOCHROME_PATTERN0 0x00000318
-
-#define NV04_IMAGE_PATTERN_MONOCHROME_PATTERN1 0x0000031c
-
-#define NV04_IMAGE_PATTERN_PATTERN_Y8(i0) (0x00000400 + 0x4*(i0))
-#define NV04_IMAGE_PATTERN_PATTERN_Y8__ESIZE 0x00000004
-#define NV04_IMAGE_PATTERN_PATTERN_Y8__LEN 0x00000010
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y0__MASK 0x000000ff
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y0__SHIFT 0
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y1__MASK 0x0000ff00
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y1__SHIFT 8
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y2__MASK 0x00ff0000
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y2__SHIFT 16
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y3__MASK 0xff000000
-#define NV04_IMAGE_PATTERN_PATTERN_Y8_Y3__SHIFT 24
-
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5(i0) (0x00000500 + 0x4*(i0))
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5__ESIZE 0x00000004
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5__LEN 0x00000020
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_B0__MASK 0x0000001f
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_B0__SHIFT 0
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_G0__MASK 0x000007e0
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_G0__SHIFT 5
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_R0__MASK 0x0000f800
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_R0__SHIFT 11
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_B1__MASK 0x001f0000
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_B1__SHIFT 16
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_G1__MASK 0x07e00000
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_G1__SHIFT 21
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_R1__MASK 0xf8000000
-#define NV04_IMAGE_PATTERN_PATTERN_R5G6B5_R1__SHIFT 27
-
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5(i0) (0x00000600 + 0x4*(i0))
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5__ESIZE 0x00000004
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5__LEN 0x00000020
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_B0__MASK 0x0000001f
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_B0__SHIFT 0
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_G0__MASK 0x000003e0
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_G0__SHIFT 5
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_R0__MASK 0x00007c00
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_R0__SHIFT 10
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_B1__MASK 0x001f0000
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_B1__SHIFT 16
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_G1__MASK 0x03e00000
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_G1__SHIFT 21
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_R1__MASK 0x7c000000
-#define NV04_IMAGE_PATTERN_PATTERN_X1R5G5B5_R1__SHIFT 26
-
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8(i0) (0x00000700 + 0x4*(i0))
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8__ESIZE 0x00000004
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8__LEN 0x00000040
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8_B__MASK 0x000000ff
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8_B__SHIFT 0
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8_G__MASK 0x0000ff00
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8_G__SHIFT 8
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8_R__MASK 0x00ff0000
-#define NV04_IMAGE_PATTERN_PATTERN_X8R8G8B8_R__SHIFT 16
-
-
-#define NV01_RENDER_SOLID_LINE_PATCH 0x0000010c
-
-#define NV01_RENDER_SOLID_LINE_DMA_NOTIFY 0x00000180
-
-#define NV01_RENDER_SOLID_LINE_CLIP_RECTANGLE 0x00000184
-
-#define NV01_RENDER_SOLID_LINE_PATTERN 0x00000188
-
-#define NV04_RENDER_SOLID_LINE_PATTERN 0x00000188
-
-#define NV01_RENDER_SOLID_LINE_ROP 0x0000018c
-
-#define NV01_RENDER_SOLID_LINE_BETA1 0x00000190
-
-#define NV01_RENDER_SOLID_LINE_SURFACE_DST 0x00000194
-
-
-#define NV04_RENDER_SOLID_LINE_BETA4 0x00000194
-
-#define NV04_RENDER_SOLID_LINE_SURFACE 0x00000198
-
-#define NV01_RENDER_SOLID_LINE_OPERATION 0x000002fc
-#define NV01_RENDER_SOLID_LINE_OPERATION_SRCCOPY_AND 0x00000000
-#define NV01_RENDER_SOLID_LINE_OPERATION_ROP_AND 0x00000001
-#define NV01_RENDER_SOLID_LINE_OPERATION_BLEND_AND 0x00000002
-#define NV01_RENDER_SOLID_LINE_OPERATION_SRCCOPY 0x00000003
-#define NV01_RENDER_SOLID_LINE_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV01_RENDER_SOLID_LINE_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV01_RENDER_SOLID_LINE_COLOR_FORMAT 0x00000300
-#define NV01_RENDER_SOLID_LINE_COLOR_FORMAT_A16R5G6B5 0x00000001
-#define NV01_RENDER_SOLID_LINE_COLOR_FORMAT_X16A1R5G5B5 0x00000002
-#define NV01_RENDER_SOLID_LINE_COLOR_FORMAT_A8R8G8B8 0x00000003
-
-#define NV01_RENDER_SOLID_LINE_COLOR 0x00000304
-
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0(i0) (0x00000400 + 0x8*(i0))
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0__LEN 0x00000010
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0_X__SHIFT 0
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_LINE_LINE_POINT0_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1(i0) (0x00000404 + 0x8*(i0))
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1__LEN 0x00000010
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1_X__SHIFT 0
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_LINE_LINE_POINT1_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT0_X(i0) (0x00000480 + 0x10*(i0))
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT0_X__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT0_X__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT0_Y(i0) (0x00000484 + 0x10*(i0))
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT0_Y__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT0_Y__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT1_X(i0) (0x00000488 + 0x10*(i0))
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT1_X__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT1_X__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT1_Y(i0) (0x0000048c + 0x10*(i0))
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT1_Y__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_LINE_LINE32_POINT1_Y__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_POLYLINE(i0) (0x00000500 + 0x4*(i0))
-#define NV01_RENDER_SOLID_LINE_POLYLINE__ESIZE 0x00000004
-#define NV01_RENDER_SOLID_LINE_POLYLINE__LEN 0x00000020
-#define NV01_RENDER_SOLID_LINE_POLYLINE_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_LINE_POLYLINE_X__SHIFT 0
-#define NV01_RENDER_SOLID_LINE_POLYLINE_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_LINE_POLYLINE_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_LINE_POLYLINE32_POINT_X(i0) (0x00000580 + 0x8*(i0))
-#define NV01_RENDER_SOLID_LINE_POLYLINE32_POINT_X__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_LINE_POLYLINE32_POINT_X__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_POLYLINE32_POINT_Y(i0) (0x00000584 + 0x8*(i0))
-#define NV01_RENDER_SOLID_LINE_POLYLINE32_POINT_Y__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_LINE_POLYLINE32_POINT_Y__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_COLOR(i0) (0x00000600 + 0x8*(i0))
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_COLOR__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_COLOR__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT(i0) (0x00000604 + 0x8*(i0))
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT__LEN 0x00000010
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT_X__SHIFT 0
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_LINE_CPOLYLINE_POINT_Y__SHIFT 16
-
-
-#define NV01_RENDER_SOLID_TRIANGLE_PATCH 0x0000010c
-
-#define NV01_RENDER_SOLID_TRIANGLE_DMA_NOTIFY 0x00000180
-
-#define NV01_RENDER_SOLID_TRIANGLE_CLIP_RECTANGLE 0x00000184
-
-#define NV01_RENDER_SOLID_TRIANGLE_PATTERN 0x00000188
-
-#define NV04_RENDER_SOLID_TRIANGLE_PATTERN 0x00000188
-
-#define NV01_RENDER_SOLID_TRIANGLE_ROP 0x0000018c
-
-#define NV01_RENDER_SOLID_TRIANGLE_BETA1 0x00000190
-
-#define NV01_RENDER_SOLID_TRIANGLE_SURFACE_DST 0x00000194
-
-
-#define NV04_RENDER_SOLID_TRIANGLE_BETA4 0x00000194
-
-#define NV04_RENDER_SOLID_TRIANGLE_SURFACE 0x00000198
-
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION 0x000002fc
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION_SRCCOPY_AND 0x00000000
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION_ROP_AND 0x00000001
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION_BLEND_AND 0x00000002
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION_SRCCOPY 0x00000003
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV01_RENDER_SOLID_TRIANGLE_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV01_RENDER_SOLID_TRIANGLE_COLOR_FORMAT 0x00000300
-#define NV01_RENDER_SOLID_TRIANGLE_COLOR_FORMAT_A16R5G6B5 0x00000001
-#define NV01_RENDER_SOLID_TRIANGLE_COLOR_FORMAT_X16A1R5G5B5 0x00000002
-#define NV01_RENDER_SOLID_TRIANGLE_COLOR_FORMAT_A8R8G8B8 0x00000003
-
-#define NV01_RENDER_SOLID_TRIANGLE_COLOR 0x00000304
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT0 0x00000310
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT0_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT0_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT0_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT0_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT1 0x00000314
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT1_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT1_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT1_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT1_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT2 0x00000318
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT2_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT2_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT2_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE_POINT2_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE32_POINT0_X 0x00000320
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE32_POINT0_Y 0x00000324
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE32_POINT1_X 0x00000328
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE32_POINT1_Y 0x0000032c
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE32_POINT2_X 0x00000330
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIANGLE32_POINT2_Y 0x00000334
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH(i0) (0x00000400 + 0x4*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH__ESIZE 0x00000004
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH__LEN 0x00000020
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH32_POINT_X(i0) (0x00000480 + 0x8*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH32_POINT_X__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH32_POINT_X__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH32_POINT_Y(i0) (0x00000484 + 0x8*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH32_POINT_Y__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_TRIMESH32_POINT_Y__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_COLOR(i0) (0x00000500 + 0x10*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_COLOR__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_COLOR__LEN 0x00000008
-
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0(i0) (0x00000504 + 0x10*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0__LEN 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT0_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1(i0) (0x00000508 + 0x10*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1__LEN 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT1_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2(i0) (0x0000050c + 0x10*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2__ESIZE 0x00000010
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2__LEN 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIANGLE_POINT2_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_COLOR(i0) (0x00000580 + 0x8*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_COLOR__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_COLOR__LEN 0x00000010
-
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT(i0) (0x00000584 + 0x8*(i0))
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT__LEN 0x00000010
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT_X__SHIFT 0
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_TRIANGLE_CTRIMESH_POINT_Y__SHIFT 16
-
-
-#define NV01_RENDER_SOLID_RECTANGLE_PATCH 0x0000010c
-
-#define NV01_RENDER_SOLID_RECTANGLE_DMA_NOTIFY 0x00000180
-
-#define NV01_RENDER_SOLID_RECTANGLE_CLIP_RECTANGLE 0x00000184
-
-#define NV01_RENDER_SOLID_RECTANGLE_PATTERN 0x00000188
-
-#define NV04_RENDER_SOLID_RECTANGLE_PATTERN 0x00000188
-
-#define NV01_RENDER_SOLID_RECTANGLE_ROP 0x0000018c
-
-#define NV01_RENDER_SOLID_RECTANGLE_BETA1 0x00000190
-
-#define NV01_RENDER_SOLID_RECTANGLE_SURFACE_DST 0x00000194
-
-
-#define NV04_RENDER_SOLID_RECTANGLE_BETA4 0x00000194
-
-#define NV04_RENDER_SOLID_RECTANGLE_SURFACE 0x00000198
-
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION 0x000002fc
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION_SRCCOPY_AND 0x00000000
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION_ROP_AND 0x00000001
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION_BLEND_AND 0x00000002
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION_SRCCOPY 0x00000003
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV01_RENDER_SOLID_RECTANGLE_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV01_RENDER_SOLID_RECTANGLE_COLOR_FORMAT 0x00000300
-#define NV01_RENDER_SOLID_RECTANGLE_COLOR_FORMAT_A16R5G6B5 0x00000001
-#define NV01_RENDER_SOLID_RECTANGLE_COLOR_FORMAT_X16A1R5G5B5 0x00000002
-#define NV01_RENDER_SOLID_RECTANGLE_COLOR_FORMAT_A8R8G8B8 0x00000003
-
-#define NV01_RENDER_SOLID_RECTANGLE_COLOR 0x00000304
-
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT(i0) (0x00000400 + 0x8*(i0))
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT__LEN 0x00000010
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT_X__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT_X__SHIFT 0
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT_Y__MASK 0xffff0000
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_POINT_Y__SHIFT 16
-
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE(i0) (0x00000404 + 0x8*(i0))
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE__ESIZE 0x00000008
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE__LEN 0x00000010
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE_W__MASK 0x0000ffff
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE_W__SHIFT 0
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE_H__MASK 0xffff0000
-#define NV01_RENDER_SOLID_RECTANGLE_RECTANGLE_SIZE_H__SHIFT 16
-
-
-#define NV01_IMAGE_BLIT_PATCH 0x0000010c
-
-
-#define NV11_IMAGE_BLIT_WAIT_FOR_IDLE 0x00000108
-
-#define NV11_IMAGE_BLIT_UNK120 0x00000120
-
-#define NV11_IMAGE_BLIT_UNK124 0x00000124
-
-#define NV11_IMAGE_BLIT_UNK128 0x00000128
-
-#define NV11_IMAGE_BLIT_UNK12C 0x0000012c
-
-#define NV11_IMAGE_BLIT_UNK130 0x00000130
-
-#define NV11_IMAGE_BLIT_UNK134 0x00000134
-
-#define NV01_IMAGE_BLIT_DMA_NOTIFY 0x00000180
-
-#define NV01_IMAGE_BLIT_COLOR_KEY 0x00000184
-
-#define NV04_IMAGE_BLIT_COLOR_KEY 0x00000184
-
-#define NV01_IMAGE_BLIT_CLIP_RECTANGLE 0x00000188
-
-#define NV01_IMAGE_BLIT_PATTERN 0x0000018c
-
-#define NV04_IMAGE_BLIT_PATTERN 0x0000018c
-
-#define NV01_IMAGE_BLIT_ROP 0x00000190
-
-#define NV01_IMAGE_BLIT_BETA1 0x00000194
-
-
-#define NV01_IMAGE_BLIT_SURFACE_SRC 0x00000198
-
-#define NV01_IMAGE_BLIT_SURFACE_DST 0x0000019c
-
-
-#define NV04_IMAGE_BLIT_BETA4 0x00000198
-
-#define NV04_IMAGE_BLIT_SURFACES 0x0000019c
-
-#define NV01_IMAGE_BLIT_OPERATION 0x000002fc
-#define NV01_IMAGE_BLIT_OPERATION_SRCCOPY_AND 0x00000000
-#define NV01_IMAGE_BLIT_OPERATION_ROP_AND 0x00000001
-#define NV01_IMAGE_BLIT_OPERATION_BLEND_AND 0x00000002
-#define NV01_IMAGE_BLIT_OPERATION_SRCCOPY 0x00000003
-#define NV01_IMAGE_BLIT_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV01_IMAGE_BLIT_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV01_IMAGE_BLIT_POINT_IN 0x00000300
-#define NV01_IMAGE_BLIT_POINT_IN_X__MASK 0x0000ffff
-#define NV01_IMAGE_BLIT_POINT_IN_X__SHIFT 0
-#define NV01_IMAGE_BLIT_POINT_IN_Y__MASK 0xffff0000
-#define NV01_IMAGE_BLIT_POINT_IN_Y__SHIFT 16
-
-#define NV01_IMAGE_BLIT_POINT_OUT 0x00000304
-#define NV01_IMAGE_BLIT_POINT_OUT_X__MASK 0x0000ffff
-#define NV01_IMAGE_BLIT_POINT_OUT_X__SHIFT 0
-#define NV01_IMAGE_BLIT_POINT_OUT_Y__MASK 0xffff0000
-#define NV01_IMAGE_BLIT_POINT_OUT_Y__SHIFT 16
-
-#define NV01_IMAGE_BLIT_SIZE 0x00000308
-#define NV01_IMAGE_BLIT_SIZE_W__MASK 0x0000ffff
-#define NV01_IMAGE_BLIT_SIZE_W__SHIFT 0
-#define NV01_IMAGE_BLIT_SIZE_H__MASK 0xffff0000
-#define NV01_IMAGE_BLIT_SIZE_H__SHIFT 16
-
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_PATCH 0x0000010c
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_DMA_NOTIFY 0x00000180
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_DMA_LUT 0x00000184
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_COLOR_KEY 0x00000188
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_CLIP_RECTANGLE 0x0000018c
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_PATTERN 0x00000190
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_ROP 0x00000194
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_BETA1 0x00000198
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_BETA4 0x0000019c
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_SURFACE 0x000001a0
-
-#define NV05_INDEXED_IMAGE_FROM_CPU_SURFACE 0x000001a0
-
-#define NV05_INDEXED_IMAGE_FROM_CPU_COLOR_CONVERSION 0x000003e0
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_OPERATION 0x000003e4
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_COLOR_FORMAT 0x000003e8
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_INDEX_FORMAT 0x000003ec
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_LUT_OFFSET 0x000003f0
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_POINT 0x000003f4
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_SIZE_OUT 0x000003f8
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_SIZE_IN 0x000003fc
-
-#define NV04_INDEXED_IMAGE_FROM_CPU_COLOR(i0) (0x00000400 + 0x4*(i0))
-#define NV04_INDEXED_IMAGE_FROM_CPU_COLOR__ESIZE 0x00000004
-#define NV04_INDEXED_IMAGE_FROM_CPU_COLOR__LEN 0x00000700
-
-
-#define NV10_IMAGE_FROM_CPU_WAIT_FOR_IDLE 0x00000108
-
-#define NV01_IMAGE_FROM_CPU_PATCH 0x0000010c
-
-#define NV01_IMAGE_FROM_CPU_DMA_NOTIFY 0x00000180
-
-#define NV01_IMAGE_FROM_CPU_COLOR_KEY 0x00000184
-
-#define NV04_IMAGE_FROM_CPU_COLOR_KEY 0x00000184
-
-#define NV01_IMAGE_FROM_CPU_CLIP_RECTANGLE 0x00000188
-
-#define NV01_IMAGE_FROM_CPU_PATTERN 0x0000018c
-
-#define NV04_IMAGE_FROM_CPU_PATTERN 0x0000018c
-
-#define NV01_IMAGE_FROM_CPU_ROP 0x00000190
-
-#define NV01_IMAGE_FROM_CPU_BETA1 0x00000194
-
-
-#define NV01_IMAGE_FROM_CPU_SURFACE_DST 0x00000198
-
-
-#define NV04_IMAGE_FROM_CPU_BETA4 0x00000198
-
-#define NV04_IMAGE_FROM_CPU_SURFACE 0x0000019c
-
-#define NV05_IMAGE_FROM_CPU_COLOR_CONVERSION 0x000002f8
-
-#define NV01_IMAGE_FROM_CPU_OPERATION 0x000002fc
-#define NV01_IMAGE_FROM_CPU_OPERATION_SRCCOPY_AND 0x00000000
-#define NV01_IMAGE_FROM_CPU_OPERATION_ROP_AND 0x00000001
-#define NV01_IMAGE_FROM_CPU_OPERATION_BLEND_AND 0x00000002
-#define NV01_IMAGE_FROM_CPU_OPERATION_SRCCOPY 0x00000003
-#define NV01_IMAGE_FROM_CPU_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV01_IMAGE_FROM_CPU_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV01_IMAGE_FROM_CPU_COLOR_FORMAT 0x00000300
-#define NV01_IMAGE_FROM_CPU_COLOR_FORMAT_R5G6G5 0x00000001
-#define NV01_IMAGE_FROM_CPU_COLOR_FORMAT_A1R5G5B5 0x00000002
-#define NV01_IMAGE_FROM_CPU_COLOR_FORMAT_X1R5G5B5 0x00000003
-#define NV01_IMAGE_FROM_CPU_COLOR_FORMAT_A8R8G8B8 0x00000004
-#define NV01_IMAGE_FROM_CPU_COLOR_FORMAT_X8R8G8B8 0x00000005
-
-#define NV01_IMAGE_FROM_CPU_POINT 0x00000304
-#define NV01_IMAGE_FROM_CPU_POINT_X__MASK 0x0000ffff
-#define NV01_IMAGE_FROM_CPU_POINT_X__SHIFT 0
-#define NV01_IMAGE_FROM_CPU_POINT_Y__MASK 0xffff0000
-#define NV01_IMAGE_FROM_CPU_POINT_Y__SHIFT 16
-
-#define NV01_IMAGE_FROM_CPU_SIZE_OUT 0x00000308
-#define NV01_IMAGE_FROM_CPU_SIZE_OUT_W__MASK 0x0000ffff
-#define NV01_IMAGE_FROM_CPU_SIZE_OUT_W__SHIFT 0
-#define NV01_IMAGE_FROM_CPU_SIZE_OUT_H__MASK 0xffff0000
-#define NV01_IMAGE_FROM_CPU_SIZE_OUT_H__SHIFT 16
-
-#define NV01_IMAGE_FROM_CPU_SIZE_IN 0x0000030c
-#define NV01_IMAGE_FROM_CPU_SIZE_IN_W__MASK 0x0000ffff
-#define NV01_IMAGE_FROM_CPU_SIZE_IN_W__SHIFT 0
-#define NV01_IMAGE_FROM_CPU_SIZE_IN_H__MASK 0xffff0000
-#define NV01_IMAGE_FROM_CPU_SIZE_IN_H__SHIFT 16
-
-#define NV01_IMAGE_FROM_CPU_COLOR(i0) (0x00000400 + 0x4*(i0))
-#define NV01_IMAGE_FROM_CPU_COLOR__ESIZE 0x00000004
-#define NV01_IMAGE_FROM_CPU_COLOR__LEN 0x00000020
-
-#define NV04_IMAGE_FROM_CPU_COLOR(i0) (0x00000400 + 0x4*(i0))
-#define NV04_IMAGE_FROM_CPU_COLOR__ESIZE 0x00000004
-#define NV04_IMAGE_FROM_CPU_COLOR__LEN 0x00000700
-
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_PATCH 0x0000010c
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_DMA_NOTIFY 0x00000180
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_COLOR_KEY 0x00000184
-
-#define NV04_STRETCHED_IMAGE_FROM_CPU_COLOR_KEY 0x00000184
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_PATTERN 0x00000188
-
-#define NV04_STRETCHED_IMAGE_FROM_CPU_PATTERN 0x00000188
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_ROP 0x0000018c
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_BETA1 0x00000190
-
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_SURFACE_DST 0x00000194
-
-
-#define NV04_STRETCHED_IMAGE_FROM_CPU_BETA4 0x00000194
-
-#define NV04_STRETCHED_IMAGE_FROM_CPU_SURFACE 0x00000198
-
-#define NV05_STRETCHED_IMAGE_FROM_CPU_COLOR_CONVERSION 0x000002f8
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_OPERATION 0x000002fc
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_COLOR_FORMAT 0x00000300
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_SIZE_IN 0x00000304
-#define NV03_STRETCHED_IMAGE_FROM_CPU_SIZE_IN_W__MASK 0x0000ffff
-#define NV03_STRETCHED_IMAGE_FROM_CPU_SIZE_IN_W__SHIFT 0
-#define NV03_STRETCHED_IMAGE_FROM_CPU_SIZE_IN_H__MASK 0xffff0000
-#define NV03_STRETCHED_IMAGE_FROM_CPU_SIZE_IN_H__SHIFT 16
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_DX_DU 0x00000308
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_DY_DV 0x0000030c
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_POINT 0x00000310
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_POINT_X__MASK 0x0000ffff
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_POINT_X__SHIFT 0
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_POINT_Y__MASK 0xffff0000
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_POINT_Y__SHIFT 16
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_SIZE 0x00000314
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_SIZE_W__MASK 0x0000ffff
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_SIZE_W__SHIFT 0
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_SIZE_H__MASK 0xffff0000
-#define NV03_STRETCHED_IMAGE_FROM_CPU_CLIP_SIZE_H__SHIFT 16
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_POINT12D4 0x00000318
-#define NV03_STRETCHED_IMAGE_FROM_CPU_POINT12D4_X__MASK 0x0000ffff
-#define NV03_STRETCHED_IMAGE_FROM_CPU_POINT12D4_X__SHIFT 0
-#define NV03_STRETCHED_IMAGE_FROM_CPU_POINT12D4_Y__MASK 0xffff0000
-#define NV03_STRETCHED_IMAGE_FROM_CPU_POINT12D4_Y__SHIFT 16
-
-#define NV03_STRETCHED_IMAGE_FROM_CPU_COLOR(i0) (0x00000400 + 0x4*(i0))
-#define NV03_STRETCHED_IMAGE_FROM_CPU_COLOR__ESIZE 0x00000004
-#define NV03_STRETCHED_IMAGE_FROM_CPU_COLOR__LEN 0x00000700
-
-
-#define NV10_SCALED_IMAGE_FROM_MEMORY_WAIT_FOR_IDLE 0x00000108
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_DMA_NOTIFY 0x00000180
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_DMA_IMAGE 0x00000184
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_PATTERN 0x00000188
-
-#define NV04_SCALED_IMAGE_FROM_MEMORY_PATTERN 0x00000188
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_ROP 0x0000018c
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_BETA1 0x00000190
-
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_SURFACE_DST 0x00000194
-
-
-#define NV04_SCALED_IMAGE_FROM_MEMORY_BETA4 0x00000194
-
-#define NV04_SCALED_IMAGE_FROM_MEMORY_SURFACE 0x00000198
-
-#define NV05_SCALED_IMAGE_FROM_MEMORY_SURFACE 0x00000198
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_CONVERSION 0x000002fc
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_CONVERSION_DITHER 0x00000000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_CONVERSION_TRUNCATE 0x00000001
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_CONVERSION_SUBTR_TRUNCATE 0x00000002
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT 0x00000300
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_A1R5G5B5 0x00000001
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_X1R5G5B5 0x00000002
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_A8R8G8B8 0x00000003
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_X8R8G8B8 0x00000004
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_V8YB8U8YA8 0x00000005
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_YB8V8YA8U8 0x00000006
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_R5G6B5 0x00000007
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_Y8 0x00000008
-#define NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_AY8 0x00000009
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION 0x00000304
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_SRCCOPY_AND 0x00000000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_ROP_AND 0x00000001
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_BLEND_AND 0x00000002
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_SRCCOPY 0x00000003
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_POINT 0x00000308
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_POINT_X__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_POINT_X__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_POINT_Y__MASK 0xffff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_POINT_Y__SHIFT 16
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_SIZE 0x0000030c
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_SIZE_W__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_SIZE_W__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_SIZE_H__MASK 0xffff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_SIZE_H__SHIFT 16
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_POINT 0x00000310
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_POINT_X__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_POINT_X__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_POINT_Y__MASK 0xffff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_POINT_Y__SHIFT 16
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_SIZE 0x00000314
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_SIZE_W__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_SIZE_W__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_SIZE_H__MASK 0xffff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OUT_SIZE_H__SHIFT 16
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_DU_DX 0x00000318
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_DV_DY 0x0000031c
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_SIZE 0x00000400
-#define NV03_SCALED_IMAGE_FROM_MEMORY_SIZE_W__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_SIZE_W__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_SIZE_H__MASK 0xffff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_SIZE_H__SHIFT 16
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT 0x00000404
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_PITCH__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_PITCH__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_ORIGIN__MASK 0x00ff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_ORIGIN__SHIFT 16
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_ORIGIN_CENTER 0x00010000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_ORIGIN_CORNER 0x00020000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_FILTER__MASK 0xff000000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_FILTER__SHIFT 24
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_FILTER_POINT_SAMPLE 0x00000000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_FILTER_BILINEAR 0x01000000
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_OFFSET 0x00000408
-
-#define NV03_SCALED_IMAGE_FROM_MEMORY_POINT 0x0000040c
-#define NV03_SCALED_IMAGE_FROM_MEMORY_POINT_U__MASK 0x0000ffff
-#define NV03_SCALED_IMAGE_FROM_MEMORY_POINT_U__SHIFT 0
-#define NV03_SCALED_IMAGE_FROM_MEMORY_POINT_V__MASK 0xffff0000
-#define NV03_SCALED_IMAGE_FROM_MEMORY_POINT_V__SHIFT 16
-
-
-#define NV50_SCALED_IMAGE_FROM_MEMORY_OFFSET_HIGH 0x00000410
-
-#define NV50_SCALED_IMAGE_FROM_MEMORY_SRC_LINEAR 0x00000414
-
-#define NV50_SCALED_IMAGE_FROM_MEMORY_SRC_TILE_MODE 0x00000418
-
-
-#define NV03_GDI_RECTANGLE_TEXT_DMA_NOTIFY 0x00000180
-
-#define NV03_GDI_RECTANGLE_TEXT_PATTERN 0x00000184
-
-#define NV03_GDI_RECTANGLE_TEXT_ROP 0x00000188
-
-#define NV03_GDI_RECTANGLE_TEXT_BETA1 0x0000019c
-
-#define NV03_GDI_RECTANGLE_TEXT_SURFACE_DST 0x00000190
-
-#define NV03_GDI_RECTANGLE_TEXT_OPERATION 0x000002fc
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR_FORMAT 0x00000300
-
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_FORMAT 0x00000304
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR1_A 0x000003fc
-
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT 0x00000400
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_Y__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_Y__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_X__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_X__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE 0x00000404
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_H__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_H__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_W__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_W__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT0_B 0x000007f4
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT0_B_L__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT0_B_L__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT0_B_T__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT0_B_T__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT1_B 0x000007f8
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT1_B_R__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT1_B_R__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT1_B_B__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_POINT1_B_B__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR1_B 0x000007fc
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0 0x00000800
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_L__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_L__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_T__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_T__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1 0x00000804
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_R__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_R__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_B__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_B__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT0 0x00000bec
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_L__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_L__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_T__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_T__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT1 0x00000bf0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_R__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_R__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_B__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_B__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR1_C 0x00000bf4
-
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_C 0x00000bf8
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_C_W__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_C_W__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_C_H__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_C_H__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_POINT_C 0x00000bfc
-#define NV03_GDI_RECTANGLE_TEXT_POINT_C_X__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_POINT_C_X__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_POINT_C_Y__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_POINT_C_Y__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_C(i0) (0x00000c00 + 0x4*(i0))
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_C__ESIZE 0x00000004
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_C__LEN 0x00000020
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT0 0x00000fe8
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT0_L__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT0_L__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT0_T__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT0_T__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT1 0x00000fec
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT1_R__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT1_R__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT1_B__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_D_POINT1_B__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR1_D 0x00000ff0
-
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_D 0x00000ff4
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_D_W__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_D_W__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_D_H__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_D_H__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_D 0x00000ff8
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_D_W__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_D_W__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_D_H__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_D_H__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_POINT_D 0x00000ffc
-#define NV03_GDI_RECTANGLE_TEXT_POINT_D_X__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_POINT_D_X__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_POINT_D_Y__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_POINT_D_Y__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_D(i0) (0x00001000 + 0x4*(i0))
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_D__ESIZE 0x00000004
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_D__LEN 0x00000020
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT0 0x000013e4
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_L__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_L__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_T__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_T__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT1 0x000013e8
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_R__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_R__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_B__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_B__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR0_E 0x000013ec
-
-#define NV03_GDI_RECTANGLE_TEXT_COLOR1_E 0x000013f0
-
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_E 0x000013f4
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_E_W__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_E_W__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_E_H__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_IN_E_H__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_E 0x000013f8
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_E_W__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_E_W__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_E_H__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_SIZE_OUT_E_H__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_POINT_E 0x000013fc
-#define NV03_GDI_RECTANGLE_TEXT_POINT_E_X__MASK 0x0000ffff
-#define NV03_GDI_RECTANGLE_TEXT_POINT_E_X__SHIFT 0
-#define NV03_GDI_RECTANGLE_TEXT_POINT_E_Y__MASK 0xffff0000
-#define NV03_GDI_RECTANGLE_TEXT_POINT_E_Y__SHIFT 16
-
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR01_E(i0) (0x00001400 + 0x4*(i0))
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR01_E__ESIZE 0x00000004
-#define NV03_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR01_E__LEN 0x00000020
-
-
-#define NV04_GDI_RECTANGLE_TEXT_PATCH 0x0000010c
-
-#define NV04_GDI_RECTANGLE_TEXT_DMA_NOTIFY 0x00000180
-
-#define NV04_GDI_RECTANGLE_TEXT_DMA_FONTS 0x00000184
-
-#define NV04_GDI_RECTANGLE_TEXT_PATTERN 0x00000188
-
-#define NV04_GDI_RECTANGLE_TEXT_ROP 0x0000018c
-
-#define NV04_GDI_RECTANGLE_TEXT_BETA1 0x00000190
-
-#define NV04_GDI_RECTANGLE_TEXT_BETA4 0x00000194
-
-#define NV04_GDI_RECTANGLE_TEXT_SURFACE 0x00000198
-
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION 0x000002fc
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION_SRCCOPY_AND 0x00000000
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION_ROP_AND 0x00000001
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION_BLEND_AND 0x00000002
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION_SRCCOPY 0x00000003
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION_SRCCOPY_PREMULT 0x00000004
-#define NV04_GDI_RECTANGLE_TEXT_OPERATION_BLEND_PREMULT 0x00000005
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT 0x00000300
-#define NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT_A16R5G6B5 0x00000001
-#define NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT_X16A1R5G5B5 0x00000002
-#define NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT_A8R8G8B8 0x00000003
-
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_FORMAT 0x00000304
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_FORMAT_CGA6 0x00000001
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_FORMAT_LE 0x00000002
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR1_A 0x000003fc
-
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT(i0) (0x00000400 + 0x8*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT__ESIZE 0x00000008
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT__LEN 0x00000020
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_Y__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_Y__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_X__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT_X__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE(i0) (0x00000404 + 0x8*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE__ESIZE 0x00000008
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE__LEN 0x00000020
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_H__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_H__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_W__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_SIZE_W__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT0 0x000005f4
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT0_L__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT0_L__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT0_T__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT0_T__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT1 0x000005f8
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT1_R__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT1_R__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT1_B__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_B_POINT1_B__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR1_B 0x000005fc
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0(i0) (0x00000600 + 0x8*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0__ESIZE 0x00000008
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0__LEN 0x00000020
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_L__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_L__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_T__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_0_T__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1(i0) (0x00000604 + 0x8*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1__ESIZE 0x00000008
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1__LEN 0x00000020
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_R__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_R__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_B__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIPPED_RECTANGLE_POINT_1_B__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT0 0x000007ec
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_L__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_L__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_T__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT0_T__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT1 0x000007f0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_R__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_R__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_B__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_C_POINT1_B__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR1_C 0x000007f4
-
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_C 0x000007f8
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_C_W__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_C_W__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_C_H__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_C_H__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_POINT_C 0x000007fc
-#define NV04_GDI_RECTANGLE_TEXT_POINT_C_X__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_POINT_C_X__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_POINT_C_Y__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_POINT_C_Y__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_C(i0) (0x00000800 + 0x4*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_C__ESIZE 0x00000004
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR1_C__LEN 0x00000080
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT0 0x00000be4
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_L__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_L__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_T__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT0_T__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT1 0x00000be8
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_R__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_R__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_B__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_E_POINT1_B__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR0_E 0x00000bec
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR1_E 0x00000bf0
-
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_IN_E 0x00000bf4
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_IN_E_W__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_IN_E_W__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_IN_E_H__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_IN_E_H__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_OUT_E 0x00000bf8
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_OUT_E_W__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_OUT_E_W__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_OUT_E_H__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_SIZE_OUT_E_H__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_POINT_E 0x00000bfc
-#define NV04_GDI_RECTANGLE_TEXT_POINT_E_X__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_POINT_E_X__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_POINT_E_Y__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_POINT_E_Y__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR01_E(i0) (0x00000c00 + 0x4*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR01_E__ESIZE 0x00000004
-#define NV04_GDI_RECTANGLE_TEXT_MONOCHROME_COLOR01_E__LEN 0x00000080
-
-#define NV04_GDI_RECTANGLE_TEXT_FONT_F 0x00000ff0
-#define NV04_GDI_RECTANGLE_TEXT_FONT_F_OFFSET__MASK 0x0fffffff
-#define NV04_GDI_RECTANGLE_TEXT_FONT_F_OFFSET__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_FONT_F_PITCH__MASK 0xf0000000
-#define NV04_GDI_RECTANGLE_TEXT_FONT_F_PITCH__SHIFT 28
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT0 0x00000ff4
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT0_L__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT0_L__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT0_T__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT0_T__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT1 0x00000ff8
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT1_R__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT1_R__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT1_B__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_F_POINT1_B__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR1_F 0x00000ffc
-
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F(i0) (0x00001000 + 0x4*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F__ESIZE 0x00000004
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F__LEN 0x00000100
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F_INDEX__MASK 0x000000ff
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F_INDEX__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F_X__MASK 0x000fff00
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F_X__SHIFT 8
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F_Y__MASK 0xfff00000
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_F_Y__SHIFT 20
-
-#define NV04_GDI_RECTANGLE_TEXT_FONT_G 0x000017f0
-#define NV04_GDI_RECTANGLE_TEXT_FONT_G_OFFSET__MASK 0x0fffffff
-#define NV04_GDI_RECTANGLE_TEXT_FONT_G_OFFSET__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_FONT_G_PITCH__MASK 0xf0000000
-#define NV04_GDI_RECTANGLE_TEXT_FONT_G_PITCH__SHIFT 28
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT0 0x000017f4
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT0_L__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT0_L__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT0_T__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT0_T__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT1 0x000017f8
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT1_R__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT1_R__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT1_B__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CLIP_G_POINT1_B__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_COLOR1_G 0x000017fc
-
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT(i0) (0x00001800 + 0x8*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT__ESIZE 0x00000008
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT__LEN 0x00000100
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT_X__MASK 0x0000ffff
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT_X__SHIFT 0
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT_Y__MASK 0xffff0000
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_POINT_Y__SHIFT 16
-
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_INDEX(i0) (0x00001804 + 0x8*(i0))
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_INDEX__ESIZE 0x00000008
-#define NV04_GDI_RECTANGLE_TEXT_CHARACTER_COLOR1_G_INDEX__LEN 0x00000100
-
-
-#define NV10_TEXTURE_FROM_CPU_WAIT_FOR_IDLE 0x00000108
-
-#define NV10_TEXTURE_FROM_CPU_DMA_NOTIFY 0x00000180
-
-#define NV10_TEXTURE_FROM_CPU_SURFACE 0x00000184
-
-#define NV10_TEXTURE_FROM_CPU_COLOR_FORMAT 0x00000300
-
-#define NV10_TEXTURE_FROM_CPU_POINT 0x00000304
-#define NV10_TEXTURE_FROM_CPU_POINT_X__MASK 0x0000ffff
-#define NV10_TEXTURE_FROM_CPU_POINT_X__SHIFT 0
-#define NV10_TEXTURE_FROM_CPU_POINT_Y__MASK 0xffff0000
-#define NV10_TEXTURE_FROM_CPU_POINT_Y__SHIFT 16
-
-#define NV10_TEXTURE_FROM_CPU_SIZE 0x00000308
-#define NV10_TEXTURE_FROM_CPU_SIZE_W__MASK 0x0000ffff
-#define NV10_TEXTURE_FROM_CPU_SIZE_W__SHIFT 0
-#define NV10_TEXTURE_FROM_CPU_SIZE_H__MASK 0xffff0000
-#define NV10_TEXTURE_FROM_CPU_SIZE_H__SHIFT 16
-
-#define NV10_TEXTURE_FROM_CPU_CLIP_HORIZONTAL 0x0000030c
-#define NV10_TEXTURE_FROM_CPU_CLIP_HORIZONTAL_X__MASK 0x0000ffff
-#define NV10_TEXTURE_FROM_CPU_CLIP_HORIZONTAL_X__SHIFT 0
-#define NV10_TEXTURE_FROM_CPU_CLIP_HORIZONTAL_W__MASK 0xffff0000
-#define NV10_TEXTURE_FROM_CPU_CLIP_HORIZONTAL_W__SHIFT 16
-
-#define NV10_TEXTURE_FROM_CPU_CLIP_VERTICAL 0x00000310
-#define NV10_TEXTURE_FROM_CPU_CLIP_VERTICAL_Y__MASK 0x0000ffff
-#define NV10_TEXTURE_FROM_CPU_CLIP_VERTICAL_Y__SHIFT 0
-#define NV10_TEXTURE_FROM_CPU_CLIP_VERTICAL_H__MASK 0xffff0000
-#define NV10_TEXTURE_FROM_CPU_CLIP_VERTICAL_H__SHIFT 16
-
-#define NV10_TEXTURE_FROM_CPU_COLOR(i0) (0x00000400 + 0x4*(i0))
-#define NV10_TEXTURE_FROM_CPU_COLOR__ESIZE 0x00000004
-#define NV10_TEXTURE_FROM_CPU_COLOR__LEN 0x00000700
-
-
-#endif /* NV01_2D_XML */
+++ /dev/null
-/**************************************************************************
- *
- * Copyright 2009 Ben Skeggs
- * Copyright 2009 Younes Manton
- * Copyright 2010 Luca Barbieri
- * All Rights Reserved.
- *
- * Permission is hereby granted, free of charge, to any person obtaining
- * a copy of this software and associated documentation files (the
- * "Software"), to deal in the Software without restriction, including
- * without limitation the rights to use, copy, modify, merge, publish,
- * distribute, sub license, and/or sell copies of the Software, and to
- * permit persons to whom the Software is furnished to do so, subject to
- * the following conditions:
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
- * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
- * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
- * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
- * USE OR OTHER DEALINGS IN THE SOFTWARE.
- *
- * The above copyright notice and this permission notice (including the
- * next paragraph) shall be included in all copies or substantial portions
- * of the Software.
- *
- **************************************************************************/
-
-/* this code has no Mesa or Gallium dependency and can be reused in the classic Mesa driver or DDX */
-
-#include <stdlib.h>
-#include <stdio.h>
-#include <stdint.h>
-#include <nouveau/nouveau_device.h>
-#include <nouveau/nouveau_channel.h>
-#include <nouveau/nouveau_bo.h>
-#include <nouveau/nouveau_notifier.h>
-#include <nouveau/nouveau_grobj.h>
-#include <nouveau/nv04_pushbuf.h>
-#include "nv04_2d.h"
-
-#include "nouveau/nv_object.xml.h"
-#include "nouveau/nv_m2mf.xml.h"
-#include "nv01_2d.xml.h"
-
-/* avoid depending on Mesa/Gallium */
-#ifdef __GNUC__
-#define likely(x) __builtin_expect(!!(x), 1)
-#define unlikely(x) __builtin_expect(!!(x), 0)
-#else
-#define likely(x) !!(x)
-#define unlikely(x) !!(x)
-#endif
-
-#define MIN2( A, B ) ( (A)<(B) ? (A) : (B) )
-#define MAX2( A, B ) ( (A)>(B) ? (A) : (B) )
-
-struct nv04_2d_context
-{
- struct nouveau_notifier *ntfy;
- struct nouveau_grobj *surf2d;
- struct nouveau_grobj *swzsurf;
- struct nouveau_grobj *m2mf;
- struct nouveau_grobj *rect;
- struct nouveau_grobj *sifm;
- struct nouveau_grobj *blit;
-};
-
-static inline int
-align(int value, int alignment)
-{
- return (value + alignment - 1) & ~(alignment - 1);
-}
-
-static inline int
-util_is_pot(unsigned x)
-{
- return (x & (x - 1)) == 0;
-}
-
-/* Integer base-2 logarithm, rounded towards zero. */
-static inline unsigned log2i(unsigned i)
-{
- unsigned r = 0;
-
- if (i & 0xffff0000) {
- i >>= 16;
- r += 16;
- }
- if (i & 0x0000ff00) {
- i >>= 8;
- r += 8;
- }
- if (i & 0x000000f0) {
- i >>= 4;
- r += 4;
- }
- if (i & 0x0000000c) {
- i >>= 2;
- r += 2;
- }
- if (i & 0x00000002) {
- r += 1;
- }
- return r;
-}
-
-//#define NV04_REGION_DEBUG
-
-// Yes, we really want to inline everything, since all the functions are used only once
-#if defined(__GNUC__) && !defined(DEBUG)
-#define inline __attribute__((always_inline)) inline
-#endif
-
-static inline unsigned
-nv04_swizzle_bits_square(unsigned x, unsigned y)
-{
- unsigned u = (x & 0x001) << 0 |
- (x & 0x002) << 1 |
- (x & 0x004) << 2 |
- (x & 0x008) << 3 |
- (x & 0x010) << 4 |
- (x & 0x020) << 5 |
- (x & 0x040) << 6 |
- (x & 0x080) << 7 |
- (x & 0x100) << 8 |
- (x & 0x200) << 9 |
- (x & 0x400) << 10 |
- (x & 0x800) << 11;
-
- unsigned v = (y & 0x001) << 1 |
- (y & 0x002) << 2 |
- (y & 0x004) << 3 |
- (y & 0x008) << 4 |
- (y & 0x010) << 5 |
- (y & 0x020) << 6 |
- (y & 0x040) << 7 |
- (y & 0x080) << 8 |
- (y & 0x100) << 9 |
- (y & 0x200) << 10 |
- (y & 0x400) << 11 |
- (y & 0x800) << 12;
- return v | u;
-}
-
-/* rectangular swizzled textures are linear concatenations of swizzled square tiles */
-static inline unsigned
-nv04_swizzle_bits_2d(unsigned x, unsigned y, unsigned w, unsigned h)
-{
- if(h <= 1)
- return x;
- else
- {
- unsigned s = MIN2(w, h);
- unsigned m = s - 1;
- return (((x | y) & ~m) * s) | nv04_swizzle_bits_square(x & m, y & m);
- }
-}
-
-// general 3D texture case
-static inline unsigned
-nv04_swizzle_bits(unsigned x, unsigned y, unsigned z, unsigned w, unsigned h, unsigned d)
-{
- if(d <= 1)
- return nv04_swizzle_bits_2d(x, y, w, h);
- else
- {
- // TODO: autogenerate code for all possible texture sizes (13 * 13 * 13 with dims <= 4096) and do a single indirect call
- unsigned v = 0;
- w >>= 1;
- h >>= 1;
- d >>= 1;
- for(int i = 0;;)
- {
- int oldi = i;
- if(likely(w))
- {
- v |= (x & 1) << i;
- x >>= 1;
- w >>= 1;
- ++i;
- }
-
- if(likely(h))
- {
- v |= (y & 1) << i;
- y >>= 1;
- h >>= 1;
- ++i;
- }
-
- if(likely(d))
- {
- v |= (z & 1) << i;
- z >>= 1;
- d >>= 1;
- ++i;
- }
-
- if(i == oldi)
- break;
- }
- return v;
- }
-}
-
-unsigned
-nv04_region_begin(struct nv04_region* rgn, unsigned w, unsigned h)
-{
- if(rgn->pitch)
- return rgn->pitch * rgn->y + (rgn->x << rgn->bpps);
- else
- return nv04_swizzle_bits(rgn->x, rgn->y, rgn->z, rgn->w, rgn->h, rgn->d) << rgn->bpps;
-}
-
-unsigned
-nv04_region_end(struct nv04_region* rgn, unsigned w, unsigned h)
-{
- if(rgn->pitch)
- return rgn->pitch * (rgn->y + h - 1) + ((rgn->x + w) << rgn->bpps);
- else
- return (nv04_swizzle_bits(rgn->x + w - 1, rgn->y + h - 1, rgn->z, rgn->w, rgn->h, rgn->d) + 1) << rgn->bpps;
-}
-
-// *pitch = -1 -> use 3D swizzling for (x, y), *pitch = 0 -> use 2D swizzling, other *pitch -> use linear calculations
-// returns 2 if pixel order is 3D-swizzled and 1 if subrect is 2D-swizzled
-/* *pitch == -1 ret = 0 -> 3D swizzled subrect
- * *pitch == 0 ret = 0 -> 2D swizzled subrect
- * *pitch > 0 ret = 0 -> linear subrect
- * *pitch > 0 ret = 1 -> linear subrect, but with swizzled 3D data inside
- */
-
-static inline void
-nv04_region_print(struct nv04_region* rgn)
-{
- fprintf(stderr, "<%i[%i]> ", rgn->bo->handle, rgn->offset);
- if(rgn->pitch)
- fprintf(stderr, "lin %i", rgn->pitch);
- else
- fprintf(stderr, "swz %ix%ix%i", rgn->w, rgn->h, rgn->d);
- fprintf(stderr, " (%i, %i, %i)", rgn->x, rgn->y, rgn->z);
-}
-
-static inline void
-nv04_region_assert(struct nv04_region* rgn, unsigned w, unsigned h)
-{
- unsigned end = rgn->offset + nv04_region_end(rgn, w, h);
-
- assert(rgn->offset <= (int)rgn->bo->size);
- assert(end <= rgn->bo->size);
- (void) end;
- if(!rgn->pitch) {
- assert(util_is_pot(rgn->w));
- assert(util_is_pot(rgn->h));
- }
-}
-
-/* determine if region can be linearized or fake-linearized */
-static inline int
-nv04_region_is_contiguous(struct nv04_region* rgn, int w, int h)
-{
- int surf_min;
- int rect_min;
-
- if(rgn->pitch)
- return rgn->pitch == w << rgn->bpps;
-
- // redundant, but this is the fast path for the common case
- if(w == rgn->w && h == rgn->h && rgn->d <= 1)
- return 1;
-
- // must be POT
- if((w & (w - 1)) || (h & (h - 1)))
- return 0;
-
- // must be aligned
- if((rgn->x & (w - 1)) || (rgn->y & (h - 1)))
- return 0;
-
- if(rgn->d > 1)
- return 0;
-
- surf_min = MIN2(rgn->w, rgn->h);
- rect_min = MIN2(w, h);
-
- if((rect_min == surf_min) || (w == h) || (w == 2 * h))
- return 1;
-
- return 0;
-}
-
-// double the pitch until it is larger than the alignment, or the height becomes odd or 1
-static inline void
-nv04_region_contiguous_shape(struct nv04_region* rgn, int* w, int* h, int align)
-{
- while(!(*h & 1) && (*w << rgn->bpps) < (1 << align))
- {
- *w <<= 1;
- *h >>= 1;
- }
-
- while((*w << rgn->bpps) > 16384 && !(*w & 1))
- {
- *w >>= 1;
- *h <<= 1;
- }
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tCONTIGUOUS %ix%i\n", *w, *h);
-#endif
-}
-
-static inline void
-nv04_region_linearize_contiguous(struct nv04_region* rgn, unsigned w, unsigned h)
-{
- int pos;
- if(rgn->pitch)
- {
- rgn->offset += rgn->y * rgn->pitch + (rgn->x << rgn->bpps);
- rgn->x = 0;
- rgn->y = 0;
- }
- else
- {
- rgn->offset += (rgn->w * rgn->h * rgn->z) << rgn->bpps;
- pos = nv04_swizzle_bits(rgn->x, rgn->y, rgn->z, rgn->w, rgn->h, rgn->d);
- rgn->x = pos & (w - 1);
- rgn->y = pos / w;
- }
- rgn->pitch = w << rgn->bpps;
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tLINEARIZE ");
- nv04_region_print(rgn);
- fprintf(stderr, "\n");
-#endif
-}
-
- /* preserve the offset! */
- /*
- rgn->pitch = util_format_get_stride(rgn->format, w);
- int pos = nv04_swizzle_bits(rgn->x, rgn->y, rgn->z, rgn->w, rgn->h, rgn->d);
- rgn->x = pos & (w - 1);
- rgn->y = pos & ~(w - 1);
- */
-
- /*
- rgn->offset +=
- rgn->pitch = util_format_get_stride(rgn->format, w);
- rgn->x = 0;
- rgn->y = 0;
- */
-
-/* This code will get used for, and always succeed on:
- * - 4x2 1bpp swizzled texture mipmap levels
- * - linear regions created by linearization
- *
- * This code will get used for, and MAY work for:
- * - misaligned texture blanket
- * - linear surfaces created without wide_pitch (in this case, it will only work if we are lucky)
- *
- * The general case requires splitting the region in 2.
- */
-static inline int
-nv04_region_do_align_offset(struct nv04_region* rgn, unsigned w, unsigned h, int shift)
-{
- if(rgn->pitch > 0)
- {
- assert(!(rgn->offset & ((1 << rgn->bpps) - 1))); // fatal!
-
- if(h <= 1)
- {
- int delta;
- rgn->offset += rgn->y * rgn->pitch + (rgn->x << rgn->bpps);
- delta = rgn->offset & ((1 << shift) - 1);
- rgn->y = 0;
- rgn->x = delta >> rgn->bpps;
- rgn->offset -= delta;
- rgn->pitch = align((rgn->x + w) << rgn->bpps, 1 << shift);
- }
- else
- {
- int delta = rgn->offset & ((1 << shift) - 1);
- int newxo = (rgn->x << rgn->bpps) + delta;
- int dy = newxo / rgn->pitch;
- newxo -= dy * rgn->pitch;
- if((newxo + (w << rgn->bpps)) > rgn->pitch)
- {
- // TODO: split the region into two rectangles (!) if *really* necessary, unless the hardware actually supports "wrapping" rectangles
- // this does not happen if the surface is pitch-aligned, which it should always be
- assert(0);
- return -1;
- }
- rgn->x = newxo >> rgn->bpps;
- rgn->y += dy;
- }
- }
- else
- {
- int size;
- int min;
- int v;
-
- // we don't care about the alignment of 3D surfaces since the 2D engine can't use them
- if(rgn->d < 0)
- return -1;
-
- min = MIN2(rgn->w, rgn->h);
- size = min * min << rgn->bpps;
-
- // this is unfixable, and should not be happening
- if(rgn->offset & (size - 1))
- return -1;
-
- v = (rgn->offset & ((1 << shift) - 1)) / size;
- rgn->offset -= v * size;
-
- if(rgn->h == min)
- {
- unsigned w;
- rgn->x += rgn->h * v;
- w = rgn->w + rgn->h * v;
-
- while(rgn->w < w)
- rgn->w += rgn->w;
- }
- else
- {
- unsigned h;
- rgn->y += rgn->w * v;
- h = rgn->h + rgn->w * v;
-
- while(rgn->h < h)
- rgn->h += rgn->h;
- }
- }
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tALIGNED ");
- nv04_region_print(rgn);
- fprintf(stderr, "\n");
-#endif
- return 0;
-}
-
-// both pitch and shift
-// will leave the region unchanged if it fails
-static inline int
-nv04_region_align(struct nv04_region* rgn, unsigned w, unsigned h, int shift)
-{
- if(rgn->pitch & ((1 << shift) - 1))
- {
- if(h == 1)
- goto do_align; /* this will fix pitch too in this case */
- else
- return -1;
- }
-
- if(rgn->offset & ((1 << shift) - 1))
- {
- do_align:
- if(nv04_region_do_align_offset(rgn, w, h, shift))
- return -1;
- }
- return 0;
-}
-
-/* this contains 22 different copy loops after preprocessing. unfortunately, it's necessary */
-void
-nv04_region_copy_cpu(struct nv04_region* dst, struct nv04_region* src, int w, int h)
-{
- uint8_t* mdst;
- uint8_t* msrc;
- int size;
-
- if(dst->bo != src->bo)
- {
- nouveau_bo_map(dst->bo, NOUVEAU_BO_WR);
- nouveau_bo_map(src->bo, NOUVEAU_BO_RD);
- }
- else
- nouveau_bo_map(dst->bo, NOUVEAU_BO_WR | NOUVEAU_BO_RD);
-
- mdst = (uint8_t*)dst->bo->map + dst->offset;
- msrc = (uint8_t*)src->bo->map + src->offset;
-
- size = w << dst->bpps;
-
- nv04_region_assert(dst, w, h);
- nv04_region_assert(src, w, h);
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tRGN_COPY_CPU [%i, %i: %i] ", w, h, dst->bpps);
- for(int i = 0; i < 2; ++i)
- {
- nv04_region_print(i ? src : dst);
- fprintf(stderr, i ? "\n" : " <- ");
- }
-
-// for(int i = 0; i < 16; ++i)
-// fprintf(stderr, "%02x ", msrc[i]);
-// fprintf(stderr, "\n");
-#endif
-
- // TODO: support overlapping copies!
- if(src->pitch && dst->pitch)
- {
- mdst += dst->y * dst->pitch + (dst->x << dst->bpps);
- msrc += src->y * src->pitch + (src->x << src->bpps);
- if(dst->bo != src->bo)
- goto simple;
- else if(mdst < msrc)
- {
- if(mdst + size <= msrc)
- {
-simple:
- for(int iy = 0; iy < h; ++iy)
- {
- assert(mdst + size <= (uint8_t*)dst->bo->map + dst->bo->size);
- assert(msrc + size <= (uint8_t*)src->bo->map + src->bo->size);
- memcpy(mdst, msrc, size);
- msrc += src->pitch; mdst += dst->pitch;
- }
- }
- else
- {
- for(int iy = 0; iy < h; ++iy)
- {
- assert(mdst + size <= (uint8_t*)dst->bo->map + dst->bo->size);
- assert(msrc + size <= (uint8_t*)src->bo->map + src->bo->size);
- memmove(mdst, msrc, size);
- msrc += src->pitch; mdst += dst->pitch;
- }
- }
- }
- else
- {
- /* copy backwards so we don't destroy data we have to read yet */
- if(msrc + size <= mdst)
- {
- for(int iy = h - 1; iy >= 0; --iy)
- {
- assert(mdst + size <= (uint8_t*)dst->bo->map + dst->bo->size);
- assert(msrc + size <= (uint8_t*)src->bo->map + src->bo->size);
- memcpy(mdst, msrc, size);
- msrc += src->pitch; mdst += dst->pitch;
- }
- }
- else
- {
- for(int iy = h - 1; iy >= 0; --iy)
- {
- assert(mdst + size <= (uint8_t*)dst->bo->map + dst->bo->size);
- assert(msrc + size <= (uint8_t*)src->bo->map + src->bo->size);
- memmove(mdst, msrc, size);
- msrc += src->pitch; mdst += dst->pitch;
- }
- }
- }
- }
- else
- {
- int* dswx = NULL;
- int* dswy = NULL;
- int* sswx = NULL;
- int* sswy = NULL;
- int dir;
-
- if(!dst->pitch)
- {
- dswx = alloca(w * sizeof(int));
- for(int ix = 0; ix < w; ++ix) // we are adding, so z cannot be contributed by both
- dswx[ix] = nv04_swizzle_bits(dst->x + ix, 0, 0, dst->w, dst->h, dst->d);
- dswy = alloca(h * sizeof(int));
- for(int iy = 0; iy < h; ++iy)
- dswy[iy] = nv04_swizzle_bits(0, dst->y + iy, dst->z, dst->w, dst->h, dst->d);
- }
-
- if(!src->pitch)
- {
- sswx = alloca(w * sizeof(int));
- for(int ix = 0; ix < w; ++ix)
- sswx[ix] = nv04_swizzle_bits(src->x + ix, 0, 0, src->w, src->h, src->d);
- sswy = alloca(h * sizeof(int));
- for(int iy = 0; iy < h; ++iy)
- sswy[iy] = nv04_swizzle_bits(0, src->y + iy, src->z, src->w, src->h, src->d);
- }
-
- dir = 1;
- /* do backwards copies for overlapping swizzled surfaces */
- if(dst->pitch == src->pitch && dst->offset == src->offset)
- {
- if(dst->y > src->y || (dst->y == src->y && dst->x > src->x))
- dir = -1;
- }
-
-#define SWIZZLED_COPY_LOOPS
- if(dir == 1)
- {
- int dir = 1;
-#define LOOP_Y for(int iy = 0; iy < h; ++iy)
-#define LOOP_X for(int ix = 0; ix < w; ++ix)
-#include "nv04_2d_loops.h"
-#undef LOOP_X
-#undef LOOP_Y
- }
- else
- {
- int dir = -1;
-#define LOOP_Y for(int iy = h - 1; iy >= 0; --iy)
-#define LOOP_X for(int ix = w - 1; ix >= 0; --ix)
-#include "nv04_2d_loops.h"
-#undef LOOP_X
-#undef LOOP_Y
- }
-#undef SWIZZLED_COPY_LOOP
- }
-
- if(src->bo != dst->bo)
- nouveau_bo_unmap(src->bo);
- nouveau_bo_unmap(dst->bo);
-}
-
-/* TODO: if the destination is swizzled, we are doing random writes, which causes write combining to fail
- * the alternative is to read, modify and copy back, which may or may not be faster
- * loading 3D textures is a common case that hits this and could probably benefit from the temporary
- */
-void
-nv04_region_fill_cpu(struct nv04_region* dst, int w, int h, unsigned value)
-{
- uint8_t* mdst = (nouveau_bo_map(dst->bo, NOUVEAU_BO_WR), (uint8_t*)dst->bo->map + dst->offset);
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tRGN_FILL_CPU ");
- nv04_region_print(dst);
- fprintf(stderr, "\n");
-#endif
-
- nv04_region_assert(dst, w, h);
-
- if(dst->pitch)
- {
- unsigned size = w << dst->bpps;
-
-#define FILL(T) do { \
- for(int iy = 0; iy < h; ++iy) \
- { \
- assert((char*)((T*)mdst + w) <= (char*)dst->bo->map + dst->bo->size); \
- for(int ix = 0; ix < w; ++ix) \
- ((T*)mdst)[ix] = (T)value; \
- mdst += dst->pitch; \
- } \
- } while(0)
-
- mdst += dst->y * dst->pitch + (dst->x << dst->bpps);
-
- if(dst->bpps == 0)
- {
-ms:
- assert(mdst + size * h <= (uint8_t*)dst->bo->map + dst->bo->size);
- if(size == dst->pitch)
- memset(mdst, (uint8_t)value, size * h);
- else
- {
- for(int iy = 0; iy < h; ++iy)
- {
- assert(mdst + size <= (uint8_t*)dst->bo->map + dst->bo->size);
- memset(mdst, (uint8_t)value, size);
- mdst += dst->pitch;
- }
- }
- }
- else if(dst->bpps == 1)
- {
- if(!((uint8_t)value ^ (uint8_t)(value >> 8)))
- goto ms;
-
- FILL(uint16_t);
- }
- else if(dst->bpps == 2)
- {
- if(value == (uint8_t)value * 0x1010101)
- goto ms;
- FILL(uint32_t);
- }
- else
- assert(0);
-#undef FILL
- }
- else
- {
- int* dswx;
- int* dswy;
-
- dswx = alloca(w * sizeof(int));
- for(int ix = 0; ix < w; ++ix)
- dswx[ix] = nv04_swizzle_bits(dst->x + ix, 0, dst->z, dst->w, dst->h, dst->d);
- dswy = alloca(h * sizeof(int));
- for(int iy = 0; iy < h; ++iy)
- dswy[iy] = nv04_swizzle_bits(0, dst->y + iy, dst->z, dst->w, dst->h, dst->d);
-
-#define FILL(T) do { \
- T tvalue = (T)value; \
- for(int iy = 0; iy < h; ++iy) \
- { \
- T* pdst = (T*)mdst + dswy[iy]; \
- for(int ix = 0; ix < w; ++ix) \
- { \
- assert((uint8_t*)&pdst[dswx[ix] + 1] <= (uint8_t*)dst->bo->map + dst->bo->size); \
- pdst[dswx[ix]] = tvalue; \
- } \
- } \
- } while(0)
-
- if(dst->bpps == 0)
- FILL(uint8_t);
- else if(dst->bpps == 1)
- FILL(uint16_t);
- else if(dst->bpps == 2)
- FILL(uint32_t);
- else
- assert(0 && "unhandled bpp");
-#undef FILL
- }
-
- nouveau_bo_unmap(dst->bo);
-}
-
-static inline int
-nv04_region_cs2d_format(struct nv04_region* rgn)
-{
- switch(rgn->bpps) {
- case 0:
- return NV04_CONTEXT_SURFACES_2D_FORMAT_Y8;
- case 1:
- if(rgn->one_bits >= 1)
- return NV04_CONTEXT_SURFACES_2D_FORMAT_X1R5G5B5_X1R5G5B5;
- else
- return NV04_CONTEXT_SURFACES_2D_FORMAT_R5G6B5;
- case 2:
- if(rgn->one_bits >= 8)
- return NV04_CONTEXT_SURFACES_2D_FORMAT_X8R8G8B8_X8R8G8B8;
- else
- return NV04_CONTEXT_SURFACES_2D_FORMAT_A8R8G8B8;
- default:
- return -1;
- }
-}
-
-static inline int
-nv04_region_sifm_format(struct nv04_region* rgn)
-{
- switch(rgn->bpps) {
- case 0:
- return NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_Y8;
- case 1:
- if(rgn->one_bits >= 1)
- return NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_X1R5G5B5;
- else
- return NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_R5G6B5;
- case 2:
- if(rgn->one_bits >= 8)
- return NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_X8R8G8B8;
- else
- return NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_FORMAT_A8R8G8B8;
- default:
- return -1;
- }
-}
-static void
-nv04_region_copy_swizzle(struct nv04_2d_context *ctx,
- struct nv04_region* dst,
- struct nv04_region* src,
- int w, int h)
-{
- struct nouveau_channel *chan = ctx->swzsurf->channel;
- struct nouveau_grobj *swzsurf = ctx->swzsurf;
- struct nouveau_grobj *sifm = ctx->sifm;
- int cs2d_format = nv04_region_cs2d_format(dst);
- int sifm_format = nv04_region_sifm_format(src);
- /* Max width & height may not be the same on all HW, but must be POT */
- unsigned max_shift = 10;
- unsigned cw = 1 << max_shift;
- unsigned ch = 1 << max_shift;
- unsigned sx = dst->x >> max_shift;
- unsigned sy = dst->y >> max_shift;
- unsigned ex = (dst->x + w - 1) >> max_shift;
- unsigned ey = (dst->y + h - 1) >> max_shift;
- unsigned chunks = (ex - sx + 1) * (ey - sy + 1);
- unsigned chunk_size;
- if(dst->w < cw)
- cw = dst->w;
- if(dst->h < ch)
- ch = dst->h;
- chunk_size = cw * ch << dst->bpps;
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tRGN_COPY_SWIZZLE [%i, %i: %i] ", w, h, dst->bpps);
- for(int i = 0; i < 2; ++i)
- {
- nv04_region_print(i ? src : dst);
- fprintf(stderr, i ? "\n" : " <- ");
- }
-#endif
-
- nv04_region_assert(dst, w, h);
- nv04_region_assert(src, w, h);
-
- MARK_RING (chan, 8 + chunks * 17, 2 + chunks * 2);
-
- BEGIN_RING(chan, swzsurf, NV04_SWIZZLED_SURFACE_DMA_IMAGE, 1);
- OUT_RELOCo(chan, dst->bo,
- NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
-
- BEGIN_RING(chan, swzsurf, NV04_SWIZZLED_SURFACE_FORMAT, 1);
- OUT_RING (chan, cs2d_format |
- log2i(cw) << NV04_SWIZZLED_SURFACE_FORMAT_BASE_SIZE_U__SHIFT |
- log2i(ch) << NV04_SWIZZLED_SURFACE_FORMAT_BASE_SIZE_V__SHIFT);
-
- BEGIN_RING(chan, sifm, NV03_SCALED_IMAGE_FROM_MEMORY_DMA_IMAGE, 1);
- OUT_RELOCo(chan, src->bo,
- NOUVEAU_BO_GART | NOUVEAU_BO_VRAM | NOUVEAU_BO_RD);
- BEGIN_RING(chan, sifm, NV04_SCALED_IMAGE_FROM_MEMORY_SURFACE, 1);
- OUT_RING (chan, swzsurf->handle);
-
- assert(!(dst->offset & 63));
-
- for (int cy = sy; cy <= ey; ++cy) {
- int ry = MAX2(0, (int)(dst->y - ch * cy));
- int rh = MIN2((int)ch, (int)(dst->y - ch * cy + h)) - ry;
- for (int cx = sx; cx <= ex; ++cx) {
- int rx = MAX2(0, (int)(dst->x - cw * cx));
- int rw = MIN2((int)cw, (int)(dst->x - cw * cx + w)) - rx;
- unsigned dst_offset;
- unsigned src_offset;
-
- BEGIN_RING(chan, swzsurf, NV04_SWIZZLED_SURFACE_OFFSET, 1);
-
- dst_offset = dst->offset + (nv04_swizzle_bits_2d(cx * cw, cy * ch, dst->w, dst->h) << dst->bpps);
- assert(dst_offset <= dst->bo->size);
- assert(dst_offset + chunk_size <= dst->bo->size);
- OUT_RELOCl(chan, dst->bo, dst_offset,
- NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
-
- BEGIN_RING(chan, sifm, NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_CONVERSION, 9);
- OUT_RING (chan, NV03_SCALED_IMAGE_FROM_MEMORY_COLOR_CONVERSION_TRUNCATE);
- OUT_RING (chan, sifm_format);
- OUT_RING (chan, NV03_SCALED_IMAGE_FROM_MEMORY_OPERATION_SRCCOPY);
- OUT_RING (chan, rx | (ry << NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_POINT_Y__SHIFT));
- OUT_RING (chan, rh << NV03_SCALED_IMAGE_FROM_MEMORY_CLIP_SIZE_H__SHIFT | rw);
- OUT_RING (chan, rx | (ry << NV03_SCALED_IMAGE_FROM_MEMORY_OUT_POINT_Y__SHIFT));
- OUT_RING (chan, rh << NV03_SCALED_IMAGE_FROM_MEMORY_OUT_SIZE_H__SHIFT | rw);
- OUT_RING (chan, 1 << 20);
- OUT_RING (chan, 1 << 20);
-
- BEGIN_RING(chan, sifm, NV03_SCALED_IMAGE_FROM_MEMORY_SIZE, 4);
- OUT_RING (chan, rh << NV03_SCALED_IMAGE_FROM_MEMORY_SIZE_H__SHIFT | align(rw, 8));
- OUT_RING (chan, src->pitch |
- NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_ORIGIN_CENTER |
- NV03_SCALED_IMAGE_FROM_MEMORY_FORMAT_FILTER_POINT_SAMPLE);
- src_offset = src->offset + (cy * ch + ry + src->y - dst->y) * src->pitch + ((cx * cw + rx + src->x - dst->x) << src->bpps);
- assert(src_offset <= src->bo->size);
- assert(src_offset + (src->pitch * (rh - 1)) + (rw << src->bpps) <= src->bo->size);
- OUT_RELOCl(chan, src->bo, src_offset,
- NOUVEAU_BO_GART | NOUVEAU_BO_VRAM | NOUVEAU_BO_RD);
- OUT_RING (chan, 0);
- }
- }
-}
-
-static inline void
-nv04_copy_m2mf_begin(struct nv04_2d_context *ctx, struct nouveau_bo* dstbo, struct nouveau_bo* srcbo, unsigned commands)
-{
- struct nouveau_channel *chan = ctx->m2mf->channel;
- struct nouveau_grobj *m2mf = ctx->m2mf;
- MARK_RING (chan, 3 + commands * 9, 2 + commands * 2);
- BEGIN_RING(chan, m2mf, NV04_M2MF_DMA_BUFFER_IN, 2);
- OUT_RELOCo(chan, srcbo,
- NOUVEAU_BO_GART | NOUVEAU_BO_VRAM | NOUVEAU_BO_RD);
- OUT_RELOCo(chan, dstbo,
- NOUVEAU_BO_GART | NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
-}
-
-static inline void
-nv04_copy_m2mf_body(struct nv04_2d_context *ctx, struct nouveau_bo* dstbo, int* pdstoff, unsigned dstpitch, struct nouveau_bo* srcbo, int* psrcoff, unsigned srcpitch, unsigned size, unsigned lines)
-{
- struct nouveau_channel *chan = ctx->m2mf->channel;
- struct nouveau_grobj *m2mf = ctx->m2mf;
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\t\t\tCOPY_M2MF_BODY [%i, %i] <%i[%u]> lin %u <- <%i[%u]> lin %u\n", size, lines, dstbo->handle, *pdstoff, dstpitch, srcbo->handle, *psrcoff, srcpitch);
-#endif
-
- BEGIN_RING(chan, m2mf, NV04_M2MF_OFFSET_IN, 8);
- OUT_RELOCl(chan, srcbo, *psrcoff,
- NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_RD);
- OUT_RELOCl(chan, dstbo, *pdstoff,
- NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_WR);
- OUT_RING (chan, srcpitch);
- OUT_RING (chan, dstpitch);
- OUT_RING (chan, size);
- OUT_RING (chan, lines);
- OUT_RING (chan, 0x0101);
- OUT_RING (chan, 0);
-
- *psrcoff += srcpitch * lines;
- *pdstoff += dstpitch * lines;
-}
-
-static void
-nv04_copy_m2mf(struct nv04_2d_context *ctx,
- struct nouveau_bo* dstbo, int dstoff, unsigned dstpitch,
- struct nouveau_bo* srcbo, int srcoff, unsigned srcpitch,
- unsigned size, unsigned h)
-{
- unsigned max_pitch = 32767;
- unsigned max_lines = 2047;
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\t\tCOPY_M2MF [%i, %i] <%i[%i]> lin %u <- <%i[%i]> lin %u\n", size, h, dstbo->handle, dstoff, dstpitch, srcbo->handle, srcoff, srcpitch);
-#endif
-
- if(srcpitch <= max_pitch && dstpitch <= max_pitch)
- {
- unsigned full_pages = h / max_lines;
- unsigned leftover_lines = h - full_pages * max_lines;
-
- nv04_copy_m2mf_begin(ctx, dstbo, srcbo, full_pages + !!leftover_lines);
-
- for(unsigned i = 0; i < full_pages; ++i)
- nv04_copy_m2mf_body(ctx, dstbo, &dstoff, dstpitch, srcbo, &srcoff, srcpitch, size, max_lines);
-
- if(leftover_lines)
- nv04_copy_m2mf_body(ctx, dstbo, &dstoff, dstpitch, srcbo, &srcoff, srcpitch, size, leftover_lines);
- }
- else
- {
- unsigned lines = size / max_pitch;
- unsigned leftover = size - lines * max_pitch;
- unsigned full_pages = lines / max_lines;
- unsigned leftover_lines = lines - full_pages * max_lines;
- unsigned srcgap = srcpitch - size;
- unsigned dstgap = dstpitch - size;
-
- nv04_copy_m2mf_begin(ctx, dstbo, srcbo, h * (full_pages + !!leftover_lines + !!leftover));
-
- for(unsigned i = 0; i < h; ++i)
- {
- for(unsigned j = 0; j < full_pages; ++j)
- nv04_copy_m2mf_body(ctx, dstbo, &dstoff, max_pitch, srcbo, &srcoff, max_pitch, max_pitch, max_lines);
-
- if(leftover_lines)
- nv04_copy_m2mf_body(ctx, dstbo, &dstoff, max_pitch, srcbo, &srcoff, max_pitch, max_pitch, leftover_lines);
-
- if(leftover)
- nv04_copy_m2mf_body(ctx, dstbo, &dstoff, leftover, srcbo, &srcoff, leftover, leftover, 1);
-
- srcoff += srcgap;
- dstoff += dstgap;
- }
- }
-}
-
-void
-nv04_memcpy(struct nv04_2d_context *ctx, struct nouveau_bo* dstbo, int dstoff, struct nouveau_bo* srcbo, int srcoff, unsigned size)
-{
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tMEMCPY [%i] <%i[%i]> <- <%i[%i]>\n", size, dstbo->handle, dstoff, srcbo->handle, srcoff);
-#endif
-
- nv04_copy_m2mf(ctx, dstbo, dstoff, size, srcbo, srcoff, size, size, 1);
-}
-
-static void
-nv04_region_copy_m2mf(struct nv04_2d_context *ctx, struct nv04_region *dst, struct nv04_region *src, int w, int h)
-{
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tRGN_COPY_M2MF [%i, %i: %i] ", w, h, dst->bpps);
- for(int i = 0; i < 2; ++i)
- {
- nv04_region_print(i ? src : dst);
- fprintf(stderr, i ? "\n" : " <- ");
- }
-#endif
-
- nv04_region_assert(dst, w, h);
- nv04_region_assert(src, w, h);
- assert(src->pitch);
- assert(dst->pitch);
-
- nv04_copy_m2mf(ctx,
- dst->bo, dst->offset + dst->y * dst->pitch + (dst->x << dst->bpps), dst->pitch,
- src->bo, src->offset + src->y * src->pitch + (src->x << src->bpps), src->pitch,
- w << src->bpps, h);
-}
-
-static inline void
-nv04_region_copy_blit(struct nv04_2d_context *ctx, struct nv04_region* dst, struct nv04_region* src, int w, int h)
-{
- struct nouveau_channel *chan = ctx->surf2d->channel;
- struct nouveau_grobj *surf2d = ctx->surf2d;
- struct nouveau_grobj *blit = ctx->blit;
- int cs2d_format = nv04_region_cs2d_format(dst);
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tRGN_COPY_BLIT [%i, %i: %i] ", w, h, dst->bpps);
- for(int i = 0; i < 2; ++i)
- {
- nv04_region_print(i ? src : dst);
- fprintf(stderr, i ? "\n" : " <- ");
- }
-#endif
-
- assert(!(src->pitch & 63) && src->pitch);
- assert(!(dst->pitch & 63) && dst->pitch);
- nv04_region_assert(dst, w, h);
- nv04_region_assert(src, w, h);
-
- MARK_RING (chan, 12, 4);
- BEGIN_RING(chan, surf2d, NV04_CONTEXT_SURFACES_2D_DMA_IMAGE_SOURCE, 2);
- OUT_RELOCo(chan, src->bo, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD);
- OUT_RELOCo(chan, dst->bo, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
- BEGIN_RING(chan, surf2d, NV04_CONTEXT_SURFACES_2D_FORMAT, 4);
- OUT_RING (chan, cs2d_format);
- OUT_RING (chan, (dst->pitch << 16) | src->pitch);
- OUT_RELOCl(chan, src->bo, src->offset, NOUVEAU_BO_VRAM | NOUVEAU_BO_RD);
- OUT_RELOCl(chan, dst->bo, dst->offset, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
-
- BEGIN_RING(chan, blit, 0x0300, 3);
- OUT_RING (chan, (src->y << 16) | src->x);
- OUT_RING (chan, (dst->y << 16) | dst->x);
- OUT_RING (chan, ( h << 16) | w);
-}
-
-/* THEOREM: a non-linearizable swizzled destination is always 64 byte aligned, except for 4x2 mipmap levels of swizzled 1bpp surfaces
- * HYPOTESIS:
- * 1. The first mipmap level is 64-byte-aligned
- * PROOF:
- * 1. Thus, all mipmaps level with a parent which is 64-byte or more in size are.
- * 2. At 1bpp, the smallest levels with a <= 32-byte parent are either Nx1 or 1xN or size <=8, thus 4x2, 2x2 or 2x4
- * 3. Nx1, 1xN, 2x4, 2x2 have all subrects linearizable. 4x2 does not.
- * 4. At 2/4bpp or more, the smallest levels with a 32-byte parent are 1xN, Nx1 or 2x2
- *
- * However, nv04_region_align handles that.
- */
-
-// 0 -> done, 1 -> do with 3D engine or CPU, -1 -> do with CPU
-// dst and src may be modified, and the possibly modified version should be passed to nv04_region_cpu if necessary
-int
-nv04_region_copy_2d(struct nv04_2d_context *ctx, struct nv04_region* dst, struct nv04_region* src,
- int w, int h, int dst_to_gpu, int src_on_gpu)
-{
- assert(src->bpps == dst->bpps);
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "RGN_COPY [%i, %i: %i] ", w, h, dst->bpps);
- for(int i = 0; i < 2; ++i)
- {
- int gpu = i ? src_on_gpu : dst_to_gpu;
- nv04_region_print(i ? src : dst);
- fprintf(stderr, " %s", gpu ? "gpu" : "cpu");
- fprintf(stderr, i ? "\n" : " <- ");
- }
-#endif
-
- // if they are contiguous and either both swizzled or both linear, reshape
- if(!dst->pitch == !src->pitch
- && nv04_region_is_contiguous(dst, w, h)
- && nv04_region_is_contiguous(src, w, h))
- {
- nv04_region_contiguous_shape(dst, &w, &h, 6);
- nv04_region_linearize_contiguous(dst, w, h);
- nv04_region_linearize_contiguous(src, w, h);
- }
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tOPT ");
- for(int i = 0; i < 2; ++i)
- {
- nv04_region_print(i ? src : dst);
- fprintf(stderr, i ? "\n" : " <- ");
- }
-#endif
-
- /* if the destination is not for GPU _and_ source is on CPU, use CPU */
- /* if the destination is not for GPU _or_ source is on CPU, use CPU only if we think it's faster than the GPU */
- /* TODO: benchmark to find out in which cases exactly we should prefer the CPU */
- if((!dst_to_gpu && !src_on_gpu)
- || (!dst->pitch && dst->d > 1)
- /* 3D swizzled destination are unwritable by the GPU, and 2D swizzled ones are readable only by the 3D engine */
- )
- return -1;
- /* there is no known way to read 2D/3D-swizzled surfaces with the 2D engine
- * ask the caller to use the 3D engine
- * If a format cannot be sampled from the 3D engine there is no point in making it swizzled, so we must not do so
- */
- else if(!src->pitch)
- {
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tCOPY_ENG3D\n");
-#endif
- return 1;
- }
- /* Setup transfer to swizzle the texture to vram if needed */
- else
- {
- if (!dst->pitch)
- {
- if(!dst_to_gpu)
- {
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tCOPY_ENG3D\n");
-#endif
- return 1;
- }
- else
- {
- assert(!nv04_region_align(dst, w, h, 6));
-
- nv04_region_copy_swizzle(ctx, dst, src, w, h);
- return 0;
- }
- }
- else
- {
- /* NV_CONTEXT_SURFACES_2D has buffer alignment restrictions, fallback
- * to NV_M2MF in this case.
- * TODO: is this also true for the source? possibly not
- * TODO: should we just always use m2mf?
- * TODO: if not, add support for multiple operations to copy_blit
- */
-
- if (!dst_to_gpu
- || w > 2047
- || h > 2047
- || (w & 1)
- || nv04_region_align(src, w, h, 6)
- || nv04_region_align(dst, w, h, 6)
- )
- nv04_region_copy_m2mf(ctx, dst, src, w, h);
- else
- nv04_region_copy_blit(ctx, dst, src, w, h);
-
- return 0;
- }
- }
-}
-
-static inline void
-nv04_region_fill_gdirect(struct nv04_2d_context *ctx, struct nv04_region* dst, int w, int h, unsigned value)
-{
- struct nouveau_channel *chan = ctx->surf2d->channel;
- struct nouveau_grobj *surf2d = ctx->surf2d;
- struct nouveau_grobj *rect = ctx->rect;
- int cs2d_format, gdirect_format;
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tFILL_GDIRECT\n");
-#endif
-
- assert(!(dst->pitch & 63) && dst->pitch);
- nv04_region_assert(dst, w, h);
-
- switch(dst->bpps)
- {
- case 0:
- gdirect_format = NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT_A8R8G8B8;
- cs2d_format = NV04_CONTEXT_SURFACES_2D_FORMAT_Y8;
- break;
- case 1:
- gdirect_format = NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT_A16R5G6B5;
- cs2d_format = NV04_CONTEXT_SURFACES_2D_FORMAT_Y16;
- break;
- case 2:
- gdirect_format = NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT_A8R8G8B8;
- cs2d_format = NV04_CONTEXT_SURFACES_2D_FORMAT_Y32;
- break;
- default:
- assert(0);
- gdirect_format = 0;
- cs2d_format = 0;
- break;
- }
-
- MARK_RING (chan, 15, 4);
- BEGIN_RING(chan, surf2d, NV04_CONTEXT_SURFACES_2D_DMA_IMAGE_SOURCE, 2);
- OUT_RELOCo(chan, dst->bo, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
- OUT_RELOCo(chan, dst->bo, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
- BEGIN_RING(chan, surf2d, NV04_CONTEXT_SURFACES_2D_FORMAT, 4);
- OUT_RING (chan, cs2d_format);
- OUT_RING (chan, (dst->pitch << 16) | dst->pitch);
- OUT_RELOCl(chan, dst->bo, dst->offset, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
- OUT_RELOCl(chan, dst->bo, dst->offset, NOUVEAU_BO_VRAM | NOUVEAU_BO_WR);
-
- BEGIN_RING(chan, rect, NV04_GDI_RECTANGLE_TEXT_COLOR_FORMAT, 1);
- OUT_RING (chan, gdirect_format);
- BEGIN_RING(chan, rect, NV04_GDI_RECTANGLE_TEXT_COLOR1_A, 1);
- OUT_RING (chan, value);
- BEGIN_RING(chan, rect, NV04_GDI_RECTANGLE_TEXT_UNCLIPPED_RECTANGLE_POINT(0), 2);
- OUT_RING (chan, (dst->x << 16) | dst->y);
- OUT_RING (chan, ( w << 16) | h);
-}
-
-int
-nv04_region_fill_2d(struct nv04_2d_context *ctx, struct nv04_region *dst,
- int w, int h, unsigned value)
-{
- if(!w || !h)
- return 0;
-
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "FILL [%i, %i: %i] ", w, h, dst->bpps);
- nv04_region_print(dst);
- fprintf(stderr, " <- 0x%x\n", value);
-#endif
-
- if(nv04_region_is_contiguous(dst, w, h))
- {
- nv04_region_contiguous_shape(dst, &w, &h, 6);
- nv04_region_linearize_contiguous(dst, w, h);
- }
-
- // TODO: maybe do intermediate copies for some cases instead of using the 3D engine/CPU
- /* GdiRect doesn't work together with swzsurf, so the 3D engine, or an intermediate copy, is the only option here */
- if(!dst->pitch)
- {
-#ifdef NV04_REGION_DEBUG
- fprintf(stderr, "\tFILL_ENG3D\n");
-#endif
- return 1;
- }
- else if(!nv04_region_align(dst, w, h, 6))
- {
- nv04_region_fill_gdirect(ctx, dst, w, h, value);
- return 0;
- }
- else
- return -1;
-}
-
-
-void
-nv04_2d_context_takedown(struct nv04_2d_context *ctx)
-{
- nouveau_notifier_free(&ctx->ntfy);
- nouveau_grobj_free(&ctx->m2mf);
- nouveau_grobj_free(&ctx->surf2d);
- nouveau_grobj_free(&ctx->swzsurf);
- nouveau_grobj_free(&ctx->rect);
- nouveau_grobj_free(&ctx->blit);
- nouveau_grobj_free(&ctx->sifm);
-
- free(ctx);
-}
-
-struct nv04_2d_context *
-nv04_2d_context_init(struct nouveau_channel* chan)
-{
- struct nv04_2d_context *ctx = calloc(1, sizeof(struct nv04_2d_context));
- unsigned handle = 0x88000000, class;
- int ret;
-
- if (!ctx)
- return NULL;
-
- ret = nouveau_notifier_alloc(chan, handle++, 1, &ctx->ntfy);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- ret = nouveau_grobj_alloc(chan, handle++, 0x0039, &ctx->m2mf);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- BEGIN_RING(chan, ctx->m2mf, NV04_M2MF_DMA_NOTIFY, 1);
- OUT_RING (chan, ctx->ntfy->handle);
-
- if (chan->device->chipset < 0x10)
- class = NV04_CONTEXT_SURFACES_2D;
- else
- class = NV10_CONTEXT_SURFACES_2D;
-
- ret = nouveau_grobj_alloc(chan, handle++, class, &ctx->surf2d);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- BEGIN_RING(chan, ctx->surf2d,
- NV04_CONTEXT_SURFACES_2D_DMA_IMAGE_SOURCE, 2);
- OUT_RING (chan, chan->vram->handle);
- OUT_RING (chan, chan->vram->handle);
-
- if (chan->device->chipset < 0x10)
- class = NV04_IMAGE_BLIT;
- else
- class = NV11_IMAGE_BLIT;
-
- ret = nouveau_grobj_alloc(chan, handle++, class, &ctx->blit);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- BEGIN_RING(chan, ctx->blit, NV01_IMAGE_BLIT_DMA_NOTIFY, 1);
- OUT_RING (chan, ctx->ntfy->handle);
- BEGIN_RING(chan, ctx->blit, NV04_IMAGE_BLIT_SURFACES, 1);
- OUT_RING (chan, ctx->surf2d->handle);
- BEGIN_RING(chan, ctx->blit, NV01_IMAGE_BLIT_OPERATION, 1);
- OUT_RING (chan, NV01_IMAGE_BLIT_OPERATION_SRCCOPY);
-
- ret = nouveau_grobj_alloc(chan, handle++, NV04_GDI_RECTANGLE_TEXT,
- &ctx->rect);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- BEGIN_RING(chan, ctx->rect, NV04_GDI_RECTANGLE_TEXT_DMA_NOTIFY, 1);
- OUT_RING (chan, ctx->ntfy->handle);
- BEGIN_RING(chan, ctx->rect, NV04_GDI_RECTANGLE_TEXT_SURFACE, 1);
- OUT_RING (chan, ctx->surf2d->handle);
- BEGIN_RING(chan, ctx->rect, NV04_GDI_RECTANGLE_TEXT_OPERATION, 1);
- OUT_RING (chan, NV04_GDI_RECTANGLE_TEXT_OPERATION_SRCCOPY);
- BEGIN_RING(chan, ctx->rect,
- NV04_GDI_RECTANGLE_TEXT_MONOCHROME_FORMAT, 1);
- OUT_RING (chan, NV04_GDI_RECTANGLE_TEXT_MONOCHROME_FORMAT_LE);
-
- switch (chan->device->chipset & 0xf0) {
- case 0x00:
- case 0x10:
- class = NV04_SWIZZLED_SURFACE;
- break;
- case 0x20:
- class = NV11_SWIZZLED_SURFACE;
- break;
- case 0x30:
- class = NV30_SWIZZLED_SURFACE;
- break;
- case 0x40:
- case 0x60:
- class = NV40_SWIZZLED_SURFACE;
- break;
- default:
- /* Famous last words: this really can't happen.. */
- assert(0);
- break;
- }
-
- ret = nouveau_grobj_alloc(chan, handle++, class, &ctx->swzsurf);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- /* all the Gallium MARK_RING calculations assume no autobinding, so do that now */
- if(ctx->swzsurf->bound == NOUVEAU_GROBJ_UNBOUND)
- nouveau_grobj_autobind(ctx->swzsurf);
-
- switch (chan->device->chipset & 0xf0) {
- case 0x10:
- case 0x20:
- class = NV10_SCALED_IMAGE_FROM_MEMORY;
- break;
- case 0x30:
- class = NV30_SCALED_IMAGE_FROM_MEMORY;
- break;
- case 0x40:
- case 0x60:
- class = NV40_SCALED_IMAGE_FROM_MEMORY;
- break;
- default:
- class = NV04_SCALED_IMAGE_FROM_MEMORY;
- break;
- }
-
- ret = nouveau_grobj_alloc(chan, handle++, class, &ctx->sifm);
- if (ret) {
- nv04_2d_context_takedown(ctx);
- return NULL;
- }
-
- /* all the Gallium MARK_RING calculations assume no autobinding, so do that now */
- if(ctx->sifm->bound == NOUVEAU_GROBJ_UNBOUND)
- nouveau_grobj_autobind(ctx->sifm);
-
- return ctx;
-}
+++ /dev/null
-/**************************************************************************
- *
- * Copyright 2009 Ben Skeggs
- * Copyright 2009 Younes Manton
- * Copyright 2010 Luca Barbieri
- * All Rights Reserved.
- *
- * Permission is hereby granted, free of charge, to any person obtaining
- * a copy of this software and associated documentation files (the
- * "Software"), to deal in the Software without restriction, including
- * without limitation the rights to use, copy, modify, merge, publish,
- * distribute, sub license, and/or sell copies of the Software, and to
- * permit persons to whom the Software is furnished to do so, subject to
- * the following conditions:
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
- * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
- * NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS, AUTHORS
- * AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
- * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
- * USE OR OTHER DEALINGS IN THE SOFTWARE.
- *
- * The above copyright notice and this permission notice (including the
- * next paragraph) shall be included in all copies or substantial portions
- * of the Software.
- *
- **************************************************************************/
-
-/* this code has no Mesa or Gallium dependency and can be reused in the classic Mesa driver or DDX */
-
-#ifndef __NV04_2D_H__
-#define __NV04_2D_H__
-
-struct nv04_2d_context;
-struct nouveau_channel;
-struct nouveau_bo;
-
-// NOTE: all functions taking this as a parameter will CLOBBER it (except for ->bo)
-struct nv04_region {
- struct nouveau_bo* bo;
- int offset;
- unsigned pitch; // 0 -> swizzled
- unsigned bpps; // bpp shift (0, 1, 2; 3, 4 for fp/compressed)
- unsigned one_bits; // number of high bits read and written as ones (for "no-alpha" optimization)
- unsigned x, y, z;
- unsigned w, h, d;
-};
-
-static inline void
-nv04_region_try_to_linearize(struct nv04_region* rgn)
-{
- assert(!rgn->pitch);
-
- if(rgn->d <= 1)
- {
- if(rgn->h <= 1 || rgn->w <= 2)
- rgn->pitch = rgn->w << rgn->bpps;
- }
- else
- {
- if(rgn->h <= 2 && rgn->w <= 2)
- {
- rgn->pitch = rgn->w << rgn->bpps;
- rgn->offset += rgn->z * rgn->h * rgn->pitch;
- }
- }
-}
-
-void
-nv04_memcpy(struct nv04_2d_context *ctx,
- struct nouveau_bo* dstbo, int dstoff,
- struct nouveau_bo* srcbo, int srcoff,
- unsigned size);
-
-unsigned
-nv04_region_begin(struct nv04_region* rgn, unsigned w, unsigned h);
-
-unsigned
-nv04_region_end(struct nv04_region* rgn, unsigned w, unsigned h);
-
-void
-nv04_2d_context_takedown(struct nv04_2d_context *pctx);
-
-struct nv04_2d_context *
-nv04_2d_context_init(struct nouveau_channel* chan);
-
-void
-nv04_region_copy_cpu(struct nv04_region* dst, struct nv04_region* src, int w, int h);
-
-void
-nv04_region_fill_cpu(struct nv04_region* dst, int w, int h, unsigned value);
-
-int
-nv04_region_copy_2d(struct nv04_2d_context *ctx,
- struct nv04_region* dst, struct nv04_region* src,
- int w, int h,
- int dst_to_gpu, int src_on_gpu);
-
-int
-nv04_region_fill_2d(struct nv04_2d_context *ctx,
- struct nv04_region *dst,
- int w, int h,
- unsigned value);
-
-#endif
+++ /dev/null
-#ifndef T
-{
- if(dst->bpps == 0)
-#define T uint8_t
-#include "nv04_2d_loops.h"
-#undef T
- else if(dst->bpps == 1)
-#define T uint16_t
-#include "nv04_2d_loops.h"
-#undef T
- else if(dst->bpps == 2)
-#define T uint32_t
-#include "nv04_2d_loops.h"
-#undef T
- else
- assert(0);
-}
-#else
-#ifdef SWIZZLED_COPY_LOOPS
-{
- if(!dst->pitch)
- {
- if(!src->pitch)
- {
- LOOP_Y
- {
- T* pdst = (T*)mdst + dswy[iy];
- T* psrc = (T*)msrc + sswy[iy];
- LOOP_X
- {
- assert((char*)&psrc[sswx[ix] + 1] <= ((char*)src->bo->map + src->bo->size));
- assert((char*)&pdst[dswx[ix] + 1] <= ((char*)dst->bo->map + dst->bo->size));
- pdst[dswx[ix]] = psrc[sswx[ix]];
- }
- }
- }
- else
- {
- T* psrc = (T*)(msrc + ((dir > 0) ? src->y : (src->y + h - 1)) * src->pitch) + src->x;
- LOOP_Y
- {
- T* pdst = (T*)mdst + dswy[iy];
- LOOP_X
- {
- assert((char*)&psrc[ix + 1] <= ((char*)src->bo->map + src->bo->size));
- assert((char*)&pdst[dswx[ix] + 1] <= ((char*)dst->bo->map + dst->bo->size));
- pdst[dswx[ix]] = psrc[ix];
- }
- psrc = (T*)((char*)psrc + dir * src->pitch);
- }
- }
- }
- else
- {
- T* pdst = (T*)(mdst + ((dir > 0) ? dst->y : (dst->y + h - 1)) * dst->pitch) + dst->x;
- LOOP_Y
- {
- T* psrc = (T*)msrc + sswy[iy];
- LOOP_X
- {
- assert((char*)&psrc[sswx[ix] + 1] <= ((char*)src->bo->map + src->bo->size));
- assert((char*)&pdst[ix + 1] <= ((char*)dst->bo->map + dst->bo->size));
- pdst[ix] = psrc[sswx[ix]];
- }
- pdst = (T*)((char*)pdst + dir * dst->pitch);
- }
- }
-}
-#endif
-#endif
+++ /dev/null
-#ifndef NV30_40_3D_XML
-#define NV30_40_3D_XML
-
-/* Autogenerated file, DO NOT EDIT manually!
-
-This file was generated by the rules-ng-ng headergen tool in this git repository:
-http://0x04.net/cgit/index.cgi/rules-ng-ng
-git clone git://0x04.net/rules-ng-ng
-
-The rules-ng-ng source files this header was generated from are:
-- nv30-40_3d.xml ( 31709 bytes, from 2010-09-05 08:00:50)
-- copyright.xml ( 6503 bytes, from 2010-04-10 23:15:50)
-- nv_3ddefs.xml ( 15391 bytes, from 2010-09-05 08:00:46)
-- nv_defs.xml ( 4437 bytes, from 2010-08-05 19:38:53)
-- nv_object.xml ( 10424 bytes, from 2010-08-05 19:38:53)
-- nvchipsets.xml ( 2824 bytes, from 2010-08-05 19:38:53)
-
-Copyright (C) 2006-2010 by the following authors:
-- Artur Huillet <arthur.huillet@free.fr> (ahuillet)
-- Ben Skeggs (darktama, darktama_)
-- B. R. <koala_br@users.sourceforge.net> (koala_br)
-- Carlos Martin <carlosmn@users.sf.net> (carlosmn)
-- Christoph Bumiller <e0425955@student.tuwien.ac.at> (calim, chrisbmr)
-- Dawid Gajownik <gajownik@users.sf.net> (gajownik)
-- Dmitry Baryshkov
-- Dmitry Eremin-Solenikov <lumag@users.sf.net> (lumag)
-- EdB <edb_@users.sf.net> (edb_)
-- Erik Waling <erikwailing@users.sf.net> (erikwaling)
-- Francisco Jerez <currojerez@riseup.net> (curro, curro_, currojerez)
-- imirkin <imirkin@users.sf.net> (imirkin)
-- jb17bsome <jb17bsome@bellsouth.net> (jb17bsome)
-- Jeremy Kolb <kjeremy@users.sf.net> (kjeremy)
-- Laurent Carlier <lordheavym@gmail.com> (lordheavy)
-- Luca Barbieri <luca@luca-barbieri.com> (lb, lb1)
-- Maarten Maathuis <madman2003@gmail.com> (stillunknown)
-- Marcin Kościelnicki <koriakin@0x04.net> (mwk, koriakin)
-- Mark Carey <mark.carey@gmail.com> (careym)
-- Matthieu Castet <matthieu.castet@parrot.com> (mat-c)
-- nvidiaman <nvidiaman@users.sf.net> (nvidiaman)
-- Patrice Mandin <mandin.patrice@orange.fr> (pmandin, pmdata)
-- Pekka Paalanen <pq@iki.fi> (pq, ppaalanen)
-- Peter Popov <ironpeter@users.sf.net> (ironpeter)
-- Richard Hughes <hughsient@users.sf.net> (hughsient)
-- Rudi Cilibrasi <cilibrar@users.sf.net> (cilibrar)
-- Serge Martin
-- Simon Raffeiner
-- Stephane Loeuillet <leroutier@users.sf.net> (leroutier)
-- Stephane Marchesin <stephane.marchesin@gmail.com> (marcheu)
-- sturmflut <sturmflut@users.sf.net> (sturmflut)
-- Sylvain Munaut <tnt@246tNt.com>
-- Victor Stinner <victor.stinner@haypocalc.com> (haypo)
-- Wladmir van der Laan <laanwj@gmail.com> (miathan6)
-- Younes Manton <younes.m@gmail.com> (ymanton)
-
-Permission is hereby granted, free of charge, to any person obtaining
-a copy of this software and associated documentation files (the
-"Software"), to deal in the Software without restriction, including
-without limitation the rights to use, copy, modify, merge, publish,
-distribute, sublicense, and/or sell copies of the Software, and to
-permit persons to whom the Software is furnished to do so, subject to
-the following conditions:
-
-The above copyright notice and this permission notice (including the
-next paragraph) shall be included in all copies or substantial
-portions of the Software.
-
-THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
-EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
-MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
-IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
-LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
-OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
-WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
-*/
-
-
-
-#define NV30_3D_DMA_NOTIFY 0x00000180
-
-#define NV30_3D_DMA_TEXTURE0 0x00000184
-
-#define NV30_3D_DMA_TEXTURE1 0x00000188
-
-#define NV30_3D_DMA_COLOR1 0x0000018c
-
-#define NV30_3D_DMA_UNK190 0x00000190
-
-#define NV30_3D_DMA_COLOR0 0x00000194
-
-#define NV30_3D_DMA_ZETA 0x00000198
-
-#define NV30_3D_DMA_VTXBUF0 0x0000019c
-
-#define NV30_3D_DMA_VTXBUF1 0x000001a0
-
-#define NV30_3D_DMA_FENCE 0x000001a4
-
-#define NV30_3D_DMA_QUERY 0x000001a8
-
-#define NV30_3D_DMA_UNK1AC 0x000001ac
-
-#define NV30_3D_DMA_UNK1B0 0x000001b0
-
-#define NV40_3D_DMA_COLOR2 0x000001b4
-
-#define NV40_3D_DMA_COLOR3 0x000001b8
-
-#define NV30_3D_RT_HORIZ 0x00000200
-#define NV30_3D_RT_HORIZ_X__MASK 0x0000ffff
-#define NV30_3D_RT_HORIZ_X__SHIFT 0
-#define NV30_3D_RT_HORIZ_W__MASK 0xffff0000
-#define NV30_3D_RT_HORIZ_W__SHIFT 16
-
-#define NV30_3D_RT_VERT 0x00000204
-#define NV30_3D_RT_VERT_Y__MASK 0x0000ffff
-#define NV30_3D_RT_VERT_Y__SHIFT 0
-#define NV30_3D_RT_VERT_H__MASK 0xffff0000
-#define NV30_3D_RT_VERT_H__SHIFT 16
-
-#define NV30_3D_RT_FORMAT 0x00000208
-#define NV30_3D_RT_FORMAT_COLOR__MASK 0x0000001f
-#define NV30_3D_RT_FORMAT_COLOR__SHIFT 0
-#define NV30_3D_RT_FORMAT_COLOR_R5G6B5 0x00000003
-#define NV30_3D_RT_FORMAT_COLOR_X8R8G8B8 0x00000005
-#define NV30_3D_RT_FORMAT_COLOR_A8R8G8B8 0x00000008
-#define NV30_3D_RT_FORMAT_COLOR_B8 0x00000009
-#define NV30_3D_RT_FORMAT_COLOR_A16B16G16R16_FLOAT 0x0000000b
-#define NV30_3D_RT_FORMAT_COLOR_A32B32G32R32_FLOAT 0x0000000c
-#define NV30_3D_RT_FORMAT_COLOR_R32_FLOAT 0x0000000d
-#define NV30_3D_RT_FORMAT_COLOR_UNK0D 0x0000000d
-#define NV30_3D_RT_FORMAT_COLOR_X8B8G8R8 0x0000000f
-#define NV30_3D_RT_FORMAT_COLOR_A8B8G8R8 0x00000010
-#define NV30_3D_RT_FORMAT_ZETA__MASK 0x000000e0
-#define NV30_3D_RT_FORMAT_ZETA__SHIFT 5
-#define NV30_3D_RT_FORMAT_ZETA_Z16 0x00000020
-#define NV30_3D_RT_FORMAT_ZETA_Z24S8 0x00000040
-#define NV30_3D_RT_FORMAT_TYPE__MASK 0x00000f00
-#define NV30_3D_RT_FORMAT_TYPE__SHIFT 8
-#define NV30_3D_RT_FORMAT_TYPE_LINEAR 0x00000100
-#define NV30_3D_RT_FORMAT_TYPE_SWIZZLED 0x00000200
-#define NV30_3D_RT_FORMAT_LOG2_WIDTH__MASK 0x00ff0000
-#define NV30_3D_RT_FORMAT_LOG2_WIDTH__SHIFT 16
-#define NV30_3D_RT_FORMAT_LOG2_HEIGHT__MASK 0xff000000
-#define NV30_3D_RT_FORMAT_LOG2_HEIGHT__SHIFT 24
-
-#define NV30_3D_COLOR0_PITCH 0x0000020c
-#define NV30_3D_COLOR0_PITCH_COLOR0__MASK 0x0000ffff
-#define NV30_3D_COLOR0_PITCH_COLOR0__SHIFT 0
-#define NV30_3D_COLOR0_PITCH_ZETA__MASK 0xffff0000
-#define NV30_3D_COLOR0_PITCH_ZETA__SHIFT 16
-
-#define NV40_3D_COLOR0_PITCH 0x0000020c
-
-#define NV30_3D_COLOR0_OFFSET 0x00000210
-
-#define NV30_3D_ZETA_OFFSET 0x00000214
-
-#define NV30_3D_COLOR1_OFFSET 0x00000218
-
-#define NV30_3D_COLOR1_PITCH 0x0000021c
-
-#define NV30_3D_RT_ENABLE 0x00000220
-#define NV30_3D_RT_ENABLE_COLOR0 0x00000001
-#define NV30_3D_RT_ENABLE_COLOR1 0x00000002
-#define NV40_3D_RT_ENABLE_COLOR2 0x00000004
-#define NV40_3D_RT_ENABLE_COLOR3 0x00000008
-#define NV30_3D_RT_ENABLE_MRT 0x00000010
-
-#define NV40_3D_ZETA_PITCH 0x0000022c
-
-#define NV30_3D_LMA_DEPTH_PITCH 0x0000022c
-
-#define NV30_3D_LMA_DEPTH_OFFSET 0x00000230
-
-#define NV30_3D_TEX_UNITS_ENABLE 0x0000023c
-#define NV30_3D_TEX_UNITS_ENABLE_TX0 0x00000001
-#define NV30_3D_TEX_UNITS_ENABLE_TX1 0x00000002
-#define NV30_3D_TEX_UNITS_ENABLE_TX2 0x00000004
-#define NV30_3D_TEX_UNITS_ENABLE_TX3 0x00000008
-#define NV30_3D_TEX_UNITS_ENABLE_TX4 0x00000010
-#define NV30_3D_TEX_UNITS_ENABLE_TX5 0x00000020
-#define NV30_3D_TEX_UNITS_ENABLE_TX6 0x00000040
-#define NV30_3D_TEX_UNITS_ENABLE_TX7 0x00000080
-
-#define NV30_3D_TEX_MATRIX_ENABLE(i0) (0x00000240 + 0x4*(i0))
-#define NV30_3D_TEX_MATRIX_ENABLE__ESIZE 0x00000004
-#define NV30_3D_TEX_MATRIX_ENABLE__LEN 0x00000008
-
-#define NV40_3D_COLOR2_PITCH 0x00000280
-
-#define NV40_3D_COLOR3_PITCH 0x00000284
-
-#define NV40_3D_COLOR2_OFFSET 0x00000288
-
-#define NV40_3D_COLOR3_OFFSET 0x0000028c
-
-#define NV30_3D_VIEWPORT_TX_ORIGIN 0x000002b8
-#define NV30_3D_VIEWPORT_TX_ORIGIN_X__MASK 0x0000ffff
-#define NV30_3D_VIEWPORT_TX_ORIGIN_X__SHIFT 0
-#define NV30_3D_VIEWPORT_TX_ORIGIN_Y__MASK 0xffff0000
-#define NV30_3D_VIEWPORT_TX_ORIGIN_Y__SHIFT 16
-
-#define NV30_3D_VIEWPORT_CLIP_MODE 0x000002bc
-
-#define NV30_3D_VIEWPORT_CLIP_HORIZ(i0) (0x000002c0 + 0x8*(i0))
-#define NV30_3D_VIEWPORT_CLIP_HORIZ__ESIZE 0x00000008
-#define NV30_3D_VIEWPORT_CLIP_HORIZ__LEN 0x00000008
-#define NV30_3D_VIEWPORT_CLIP_HORIZ_L__MASK 0x0000ffff
-#define NV30_3D_VIEWPORT_CLIP_HORIZ_L__SHIFT 0
-#define NV30_3D_VIEWPORT_CLIP_HORIZ_R__MASK 0xffff0000
-#define NV30_3D_VIEWPORT_CLIP_HORIZ_R__SHIFT 16
-
-#define NV30_3D_VIEWPORT_CLIP_VERT(i0) (0x000002c4 + 0x8*(i0))
-#define NV30_3D_VIEWPORT_CLIP_VERT__ESIZE 0x00000008
-#define NV30_3D_VIEWPORT_CLIP_VERT__LEN 0x00000008
-#define NV30_3D_VIEWPORT_CLIP_VERT_T__MASK 0x0000ffff
-#define NV30_3D_VIEWPORT_CLIP_VERT_T__SHIFT 0
-#define NV30_3D_VIEWPORT_CLIP_VERT_D__MASK 0xffff0000
-#define NV30_3D_VIEWPORT_CLIP_VERT_D__SHIFT 16
-
-#define NV30_3D_DITHER_ENABLE 0x00000300
-
-#define NV30_3D_ALPHA_FUNC_ENABLE 0x00000304
-
-#define NV30_3D_ALPHA_FUNC_FUNC 0x00000308
-#define NV30_3D_ALPHA_FUNC_FUNC_NEVER 0x00000200
-#define NV30_3D_ALPHA_FUNC_FUNC_LESS 0x00000201
-#define NV30_3D_ALPHA_FUNC_FUNC_EQUAL 0x00000202
-#define NV30_3D_ALPHA_FUNC_FUNC_LEQUAL 0x00000203
-#define NV30_3D_ALPHA_FUNC_FUNC_GREATER 0x00000204
-#define NV30_3D_ALPHA_FUNC_FUNC_NOTEQUAL 0x00000205
-#define NV30_3D_ALPHA_FUNC_FUNC_GEQUAL 0x00000206
-#define NV30_3D_ALPHA_FUNC_FUNC_ALWAYS 0x00000207
-
-#define NV30_3D_ALPHA_FUNC_REF 0x0000030c
-
-#define NV30_3D_BLEND_FUNC_ENABLE 0x00000310
-
-#define NV30_3D_BLEND_FUNC_SRC 0x00000314
-#define NV30_3D_BLEND_FUNC_SRC_RGB__MASK 0x0000ffff
-#define NV30_3D_BLEND_FUNC_SRC_RGB__SHIFT 0
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ZERO 0x00000000
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE 0x00000001
-#define NV30_3D_BLEND_FUNC_SRC_RGB_SRC_COLOR 0x00000300
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE_MINUS_SRC_COLOR 0x00000301
-#define NV30_3D_BLEND_FUNC_SRC_RGB_SRC_ALPHA 0x00000302
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE_MINUS_SRC_ALPHA 0x00000303
-#define NV30_3D_BLEND_FUNC_SRC_RGB_DST_ALPHA 0x00000304
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE_MINUS_DST_ALPHA 0x00000305
-#define NV30_3D_BLEND_FUNC_SRC_RGB_DST_COLOR 0x00000306
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE_MINUS_DST_COLOR 0x00000307
-#define NV30_3D_BLEND_FUNC_SRC_RGB_SRC_ALPHA_SATURATE 0x00000308
-#define NV30_3D_BLEND_FUNC_SRC_RGB_CONSTANT_COLOR 0x00008001
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE_MINUS_CONSTANT_COLOR 0x00008002
-#define NV30_3D_BLEND_FUNC_SRC_RGB_CONSTANT_ALPHA 0x00008003
-#define NV30_3D_BLEND_FUNC_SRC_RGB_ONE_MINUS_CONSTANT_ALPHA 0x00008004
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA__MASK 0xffff0000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA__SHIFT 16
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ZERO 0x00000000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE 0x00010000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_SRC_COLOR 0x03000000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE_MINUS_SRC_COLOR 0x03010000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_SRC_ALPHA 0x03020000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE_MINUS_SRC_ALPHA 0x03030000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_DST_ALPHA 0x03040000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE_MINUS_DST_ALPHA 0x03050000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_DST_COLOR 0x03060000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE_MINUS_DST_COLOR 0x03070000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_SRC_ALPHA_SATURATE 0x03080000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_CONSTANT_COLOR 0x80010000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE_MINUS_CONSTANT_COLOR 0x80020000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_CONSTANT_ALPHA 0x80030000
-#define NV30_3D_BLEND_FUNC_SRC_ALPHA_ONE_MINUS_CONSTANT_ALPHA 0x80040000
-
-#define NV30_3D_BLEND_FUNC_DST 0x00000318
-#define NV30_3D_BLEND_FUNC_DST_RGB__MASK 0x0000ffff
-#define NV30_3D_BLEND_FUNC_DST_RGB__SHIFT 0
-#define NV30_3D_BLEND_FUNC_DST_RGB_ZERO 0x00000000
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE 0x00000001
-#define NV30_3D_BLEND_FUNC_DST_RGB_SRC_COLOR 0x00000300
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE_MINUS_SRC_COLOR 0x00000301
-#define NV30_3D_BLEND_FUNC_DST_RGB_SRC_ALPHA 0x00000302
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE_MINUS_SRC_ALPHA 0x00000303
-#define NV30_3D_BLEND_FUNC_DST_RGB_DST_ALPHA 0x00000304
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE_MINUS_DST_ALPHA 0x00000305
-#define NV30_3D_BLEND_FUNC_DST_RGB_DST_COLOR 0x00000306
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE_MINUS_DST_COLOR 0x00000307
-#define NV30_3D_BLEND_FUNC_DST_RGB_SRC_ALPHA_SATURATE 0x00000308
-#define NV30_3D_BLEND_FUNC_DST_RGB_CONSTANT_COLOR 0x00008001
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE_MINUS_CONSTANT_COLOR 0x00008002
-#define NV30_3D_BLEND_FUNC_DST_RGB_CONSTANT_ALPHA 0x00008003
-#define NV30_3D_BLEND_FUNC_DST_RGB_ONE_MINUS_CONSTANT_ALPHA 0x00008004
-#define NV30_3D_BLEND_FUNC_DST_ALPHA__MASK 0xffff0000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA__SHIFT 16
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ZERO 0x00000000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE 0x00010000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_SRC_COLOR 0x03000000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE_MINUS_SRC_COLOR 0x03010000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_SRC_ALPHA 0x03020000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE_MINUS_SRC_ALPHA 0x03030000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_DST_ALPHA 0x03040000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE_MINUS_DST_ALPHA 0x03050000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_DST_COLOR 0x03060000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE_MINUS_DST_COLOR 0x03070000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_SRC_ALPHA_SATURATE 0x03080000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_CONSTANT_COLOR 0x80010000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE_MINUS_CONSTANT_COLOR 0x80020000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_CONSTANT_ALPHA 0x80030000
-#define NV30_3D_BLEND_FUNC_DST_ALPHA_ONE_MINUS_CONSTANT_ALPHA 0x80040000
-
-#define NV30_3D_BLEND_COLOR 0x0000031c
-#define NV30_3D_BLEND_COLOR_B__MASK 0x000000ff
-#define NV30_3D_BLEND_COLOR_B__SHIFT 0
-#define NV30_3D_BLEND_COLOR_G__MASK 0x0000ff00
-#define NV30_3D_BLEND_COLOR_G__SHIFT 8
-#define NV30_3D_BLEND_COLOR_R__MASK 0x00ff0000
-#define NV30_3D_BLEND_COLOR_R__SHIFT 16
-#define NV30_3D_BLEND_COLOR_A__MASK 0xff000000
-#define NV30_3D_BLEND_COLOR_A__SHIFT 24
-
-#define NV30_3D_BLEND_EQUATION 0x00000320
-#define NV30_3D_BLEND_EQUATION_FUNC_ADD 0x00008006
-#define NV30_3D_BLEND_EQUATION_MIN 0x00008007
-#define NV30_3D_BLEND_EQUATION_MAX 0x00008008
-#define NV30_3D_BLEND_EQUATION_FUNC_SUBTRACT 0x0000800a
-#define NV30_3D_BLEND_EQUATION_FUNC_REVERSE_SUBTRACT 0x0000800b
-
-#define NV40_3D_BLEND_EQUATION 0x00000320
-#define NV40_3D_BLEND_EQUATION_RGB__MASK 0x0000ffff
-#define NV40_3D_BLEND_EQUATION_RGB__SHIFT 0
-#define NV40_3D_BLEND_EQUATION_RGB_FUNC_ADD 0x00008006
-#define NV40_3D_BLEND_EQUATION_RGB_MIN 0x00008007
-#define NV40_3D_BLEND_EQUATION_RGB_MAX 0x00008008
-#define NV40_3D_BLEND_EQUATION_RGB_FUNC_SUBTRACT 0x0000800a
-#define NV40_3D_BLEND_EQUATION_RGB_FUNC_REVERSE_SUBTRACT 0x0000800b
-#define NV40_3D_BLEND_EQUATION_ALPHA__MASK 0xffff0000
-#define NV40_3D_BLEND_EQUATION_ALPHA__SHIFT 16
-#define NV40_3D_BLEND_EQUATION_ALPHA_FUNC_ADD 0x80060000
-#define NV40_3D_BLEND_EQUATION_ALPHA_MIN 0x80070000
-#define NV40_3D_BLEND_EQUATION_ALPHA_MAX 0x80080000
-#define NV40_3D_BLEND_EQUATION_ALPHA_FUNC_SUBTRACT 0x800a0000
-#define NV40_3D_BLEND_EQUATION_ALPHA_FUNC_REVERSE_SUBTRACT 0x800b0000
-
-#define NV30_3D_COLOR_MASK 0x00000324
-#define NV30_3D_COLOR_MASK_B 0x000000ff
-#define NV30_3D_COLOR_MASK_G 0x0000ff00
-#define NV30_3D_COLOR_MASK_R 0x00ff0000
-#define NV30_3D_COLOR_MASK_A 0xff000000
-
-#define NV30_3D_STENCIL(i0) (0x00000328 + 0x20*(i0))
-#define NV30_3D_STENCIL__ESIZE 0x00000020
-#define NV30_3D_STENCIL__LEN 0x00000002
-
-#define NV30_3D_STENCIL_ENABLE(i0) (0x00000328 + 0x20*(i0))
-
-#define NV30_3D_STENCIL_MASK(i0) (0x0000032c + 0x20*(i0))
-
-#define NV30_3D_STENCIL_FUNC_FUNC(i0) (0x00000330 + 0x20*(i0))
-#define NV30_3D_STENCIL_FUNC_FUNC_NEVER 0x00000200
-#define NV30_3D_STENCIL_FUNC_FUNC_LESS 0x00000201
-#define NV30_3D_STENCIL_FUNC_FUNC_EQUAL 0x00000202
-#define NV30_3D_STENCIL_FUNC_FUNC_LEQUAL 0x00000203
-#define NV30_3D_STENCIL_FUNC_FUNC_GREATER 0x00000204
-#define NV30_3D_STENCIL_FUNC_FUNC_NOTEQUAL 0x00000205
-#define NV30_3D_STENCIL_FUNC_FUNC_GEQUAL 0x00000206
-#define NV30_3D_STENCIL_FUNC_FUNC_ALWAYS 0x00000207
-
-#define NV30_3D_STENCIL_FUNC_REF(i0) (0x00000334 + 0x20*(i0))
-
-#define NV30_3D_STENCIL_FUNC_MASK(i0) (0x00000338 + 0x20*(i0))
-
-#define NV30_3D_STENCIL_OP_FAIL(i0) (0x0000033c + 0x20*(i0))
-#define NV30_3D_STENCIL_OP_FAIL_ZERO 0x00000000
-#define NV30_3D_STENCIL_OP_FAIL_INVERT 0x0000150a
-#define NV30_3D_STENCIL_OP_FAIL_KEEP 0x00001e00
-#define NV30_3D_STENCIL_OP_FAIL_REPLACE 0x00001e01
-#define NV30_3D_STENCIL_OP_FAIL_INCR 0x00001e02
-#define NV30_3D_STENCIL_OP_FAIL_DECR 0x00001e03
-#define NV30_3D_STENCIL_OP_FAIL_INCR_WRAP 0x00008507
-#define NV30_3D_STENCIL_OP_FAIL_DECR_WRAP 0x00008508
-
-#define NV30_3D_STENCIL_OP_ZFAIL(i0) (0x00000340 + 0x20*(i0))
-#define NV30_3D_STENCIL_OP_ZFAIL_ZERO 0x00000000
-#define NV30_3D_STENCIL_OP_ZFAIL_INVERT 0x0000150a
-#define NV30_3D_STENCIL_OP_ZFAIL_KEEP 0x00001e00
-#define NV30_3D_STENCIL_OP_ZFAIL_REPLACE 0x00001e01
-#define NV30_3D_STENCIL_OP_ZFAIL_INCR 0x00001e02
-#define NV30_3D_STENCIL_OP_ZFAIL_DECR 0x00001e03
-#define NV30_3D_STENCIL_OP_ZFAIL_INCR_WRAP 0x00008507
-#define NV30_3D_STENCIL_OP_ZFAIL_DECR_WRAP 0x00008508
-
-#define NV30_3D_STENCIL_OP_ZPASS(i0) (0x00000344 + 0x20*(i0))
-#define NV30_3D_STENCIL_OP_ZPASS_ZERO 0x00000000
-#define NV30_3D_STENCIL_OP_ZPASS_INVERT 0x0000150a
-#define NV30_3D_STENCIL_OP_ZPASS_KEEP 0x00001e00
-#define NV30_3D_STENCIL_OP_ZPASS_REPLACE 0x00001e01
-#define NV30_3D_STENCIL_OP_ZPASS_INCR 0x00001e02
-#define NV30_3D_STENCIL_OP_ZPASS_DECR 0x00001e03
-#define NV30_3D_STENCIL_OP_ZPASS_INCR_WRAP 0x00008507
-#define NV30_3D_STENCIL_OP_ZPASS_DECR_WRAP 0x00008508
-
-#define NV30_3D_SHADE_MODEL 0x00000368
-#define NV30_3D_SHADE_MODEL_FLAT 0x00001d00
-#define NV30_3D_SHADE_MODEL_SMOOTH 0x00001d01
-
-#define NV30_3D_FOG_ENABLE 0x0000036c
-
-#define NV30_3D_FOG_COLOR 0x00000370
-#define NV30_3D_FOG_COLOR_R__MASK 0x000000ff
-#define NV30_3D_FOG_COLOR_R__SHIFT 0
-#define NV30_3D_FOG_COLOR_G__MASK 0x0000ff00
-#define NV30_3D_FOG_COLOR_G__SHIFT 8
-#define NV30_3D_FOG_COLOR_B__MASK 0x00ff0000
-#define NV30_3D_FOG_COLOR_B__SHIFT 16
-#define NV30_3D_FOG_COLOR_A__MASK 0xff000000
-#define NV30_3D_FOG_COLOR_A__SHIFT 24
-
-#define NV40_3D_MRT_COLOR_MASK 0x00000370
-#define NV40_3D_MRT_COLOR_MASK_BUFFER1_A 0x00000010
-#define NV40_3D_MRT_COLOR_MASK_BUFFER1_R 0x00000020
-#define NV40_3D_MRT_COLOR_MASK_BUFFER1_G 0x00000040
-#define NV40_3D_MRT_COLOR_MASK_BUFFER1_B 0x00000080
-#define NV40_3D_MRT_COLOR_MASK_BUFFER2_A 0x00000100
-#define NV40_3D_MRT_COLOR_MASK_BUFFER2_R 0x00000200
-#define NV40_3D_MRT_COLOR_MASK_BUFFER2_G 0x00000400
-#define NV40_3D_MRT_COLOR_MASK_BUFFER2_B 0x00000800
-#define NV40_3D_MRT_COLOR_MASK_BUFFER3_A 0x00001000
-#define NV40_3D_MRT_COLOR_MASK_BUFFER3_R 0x00002000
-#define NV40_3D_MRT_COLOR_MASK_BUFFER3_G 0x00004000
-#define NV40_3D_MRT_COLOR_MASK_BUFFER3_B 0x00008000
-
-#define NV30_3D_COLOR_LOGIC_OP_ENABLE 0x00000374
-
-#define NV30_3D_COLOR_LOGIC_OP_OP 0x00000378
-#define NV30_3D_COLOR_LOGIC_OP_OP_CLEAR 0x00001500
-#define NV30_3D_COLOR_LOGIC_OP_OP_AND 0x00001501
-#define NV30_3D_COLOR_LOGIC_OP_OP_AND_REVERSE 0x00001502
-#define NV30_3D_COLOR_LOGIC_OP_OP_COPY 0x00001503
-#define NV30_3D_COLOR_LOGIC_OP_OP_AND_INVERTED 0x00001504
-#define NV30_3D_COLOR_LOGIC_OP_OP_NOOP 0x00001505
-#define NV30_3D_COLOR_LOGIC_OP_OP_XOR 0x00001506
-#define NV30_3D_COLOR_LOGIC_OP_OP_OR 0x00001507
-#define NV30_3D_COLOR_LOGIC_OP_OP_NOR 0x00001508
-#define NV30_3D_COLOR_LOGIC_OP_OP_EQUIV 0x00001509
-#define NV30_3D_COLOR_LOGIC_OP_OP_INVERT 0x0000150a
-#define NV30_3D_COLOR_LOGIC_OP_OP_OR_REVERSE 0x0000150b
-#define NV30_3D_COLOR_LOGIC_OP_OP_COPY_INVERTED 0x0000150c
-#define NV30_3D_COLOR_LOGIC_OP_OP_OR_INVERTED 0x0000150d
-#define NV30_3D_COLOR_LOGIC_OP_OP_NAND 0x0000150e
-#define NV30_3D_COLOR_LOGIC_OP_OP_SET 0x0000150f
-
-#define NV30_3D_NORMALIZE_ENABLE 0x0000037c
-
-#define NV30_3D_COLOR_MATERIAL 0x00000390
-#define NV30_3D_COLOR_MATERIAL_FRONT_EMISSION_ENABLE 0x00000001
-#define NV30_3D_COLOR_MATERIAL_FRONT_AMBIENT_ENABLE 0x00000004
-#define NV30_3D_COLOR_MATERIAL_FRONT_DIFFUSE_ENABLE 0x00000010
-#define NV30_3D_COLOR_MATERIAL_FRONT_SPECULAR_ENABLE 0x00000040
-#define NV30_3D_COLOR_MATERIAL_BACK_EMISSION_ENABLE 0x00000100
-#define NV30_3D_COLOR_MATERIAL_BACK_AMBIENT_ENABLE 0x00000400
-#define NV30_3D_COLOR_MATERIAL_BACK_DIFFUSE_ENABLE 0x00001000
-#define NV30_3D_COLOR_MATERIAL_BACK_SPECULAR_ENABLE 0x00004000
-
-#define NV30_3D_DEPTH_RANGE_NEAR 0x00000394
-
-#define NV30_3D_DEPTH_RANGE_FAR 0x00000398
-
-#define NV30_3D_COLOR_MATERIAL_FRONT 0x000003a0
-
-
-#define NV30_3D_COLOR_MATERIAL_FRONT_R 0x000003a0
-
-#define NV30_3D_COLOR_MATERIAL_FRONT_G 0x000003a4
-
-#define NV30_3D_COLOR_MATERIAL_FRONT_B 0x000003a8
-
-#define NV30_3D_COLOR_MATERIAL_FRONT_A 0x000003ac
-
-#define NV40_3D_MIPMAP_ROUNDING 0x000003b0
-#define NV40_3D_MIPMAP_ROUNDING_MODE__MASK 0x00100000
-#define NV40_3D_MIPMAP_ROUNDING_MODE__SHIFT 20
-#define NV40_3D_MIPMAP_ROUNDING_MODE_UP 0x00000000
-#define NV40_3D_MIPMAP_ROUNDING_MODE_DOWN 0x00100000
-
-#define NV30_3D_LINE_WIDTH 0x000003b8
-
-#define NV30_3D_LINE_SMOOTH_ENABLE 0x000003bc
-
-
-
-#define NV30_3D_TEX_GEN_MODE(i0, i1) (0x00000400 + 0x10*(i0) + 0x4*(i1))
-#define NV30_3D_TEX_GEN_MODE__ESIZE 0x00000004
-#define NV30_3D_TEX_GEN_MODE__LEN 0x00000004
-#define NV30_3D_TEX_GEN_MODE_FALSE 0x00000000
-#define NV30_3D_TEX_GEN_MODE_EYE_LINEAR 0x00002400
-#define NV30_3D_TEX_GEN_MODE_OBJECT_LINEAR 0x00002401
-#define NV30_3D_TEX_GEN_MODE_SPHERE_MAP 0x00002402
-#define NV30_3D_TEX_GEN_MODE_NORMAL_MAP 0x00008511
-#define NV30_3D_TEX_GEN_MODE_REFLECTION_MAP 0x00008512
-
-#define NV30_3D_MODELVIEW_MATRIX(i0) (0x00000480 + 0x4*(i0))
-#define NV30_3D_MODELVIEW_MATRIX__ESIZE 0x00000004
-#define NV30_3D_MODELVIEW_MATRIX__LEN 0x00000010
-
-#define NV30_3D_INVERSE_MODELVIEW_MATRIX(i0) (0x00000580 + 0x4*(i0))
-#define NV30_3D_INVERSE_MODELVIEW_MATRIX__ESIZE 0x00000004
-#define NV30_3D_INVERSE_MODELVIEW_MATRIX__LEN 0x0000000c
-
-#define NV30_3D_PROJECTION_MATRIX(i0) (0x00000680 + 0x4*(i0))
-#define NV30_3D_PROJECTION_MATRIX__ESIZE 0x00000004
-#define NV30_3D_PROJECTION_MATRIX__LEN 0x00000010
-
-
-#define NV30_3D_TEX_MATRIX(i0, i1) (0x000006c0 + 0x40*(i0) + 0x4*(i1))
-#define NV30_3D_TEX_MATRIX__ESIZE 0x00000004
-#define NV30_3D_TEX_MATRIX__LEN 0x00000010
-
-#define NV30_3D_SCISSOR_HORIZ 0x000008c0
-#define NV30_3D_SCISSOR_HORIZ_X__MASK 0x0000ffff
-#define NV30_3D_SCISSOR_HORIZ_X__SHIFT 0
-#define NV30_3D_SCISSOR_HORIZ_W__MASK 0xffff0000
-#define NV30_3D_SCISSOR_HORIZ_W__SHIFT 16
-
-#define NV30_3D_SCISSOR_VERT 0x000008c4
-#define NV30_3D_SCISSOR_VERT_Y__MASK 0x0000ffff
-#define NV30_3D_SCISSOR_VERT_Y__SHIFT 0
-#define NV30_3D_SCISSOR_VERT_H__MASK 0xffff0000
-#define NV30_3D_SCISSOR_VERT_H__SHIFT 16
-
-#define NV30_3D_FOG_COORD_DIST 0x000008c8
-
-#define NV30_3D_FOG_MODE 0x000008cc
-
-#define NV30_3D_FOG_EQUATION_CONSTANT 0x000008d0
-
-#define NV30_3D_FOG_EQUATION_LINEAR 0x000008d4
-
-#define NV30_3D_FOG_EQUATION_QUADRATIC 0x000008d8
-
-#define NV30_3D_FP_ACTIVE_PROGRAM 0x000008e4
-#define NV30_3D_FP_ACTIVE_PROGRAM_DMA0 0x00000001
-#define NV30_3D_FP_ACTIVE_PROGRAM_DMA1 0x00000002
-#define NV30_3D_FP_ACTIVE_PROGRAM_OFFSET__MASK 0xfffffffc
-#define NV30_3D_FP_ACTIVE_PROGRAM_OFFSET__SHIFT 2
-
-
-#define NV30_3D_RC_COLOR0 0x000008ec
-#define NV30_3D_RC_COLOR0_B__MASK 0x000000ff
-#define NV30_3D_RC_COLOR0_B__SHIFT 0
-#define NV30_3D_RC_COLOR0_G__MASK 0x0000ff00
-#define NV30_3D_RC_COLOR0_G__SHIFT 8
-#define NV30_3D_RC_COLOR0_R__MASK 0x00ff0000
-#define NV30_3D_RC_COLOR0_R__SHIFT 16
-#define NV30_3D_RC_COLOR0_A__MASK 0xff000000
-#define NV30_3D_RC_COLOR0_A__SHIFT 24
-
-#define NV30_3D_RC_COLOR1 0x000008f0
-#define NV30_3D_RC_COLOR1_B__MASK 0x000000ff
-#define NV30_3D_RC_COLOR1_B__SHIFT 0
-#define NV30_3D_RC_COLOR1_G__MASK 0x0000ff00
-#define NV30_3D_RC_COLOR1_G__SHIFT 8
-#define NV30_3D_RC_COLOR1_R__MASK 0x00ff0000
-#define NV30_3D_RC_COLOR1_R__SHIFT 16
-#define NV30_3D_RC_COLOR1_A__MASK 0xff000000
-#define NV30_3D_RC_COLOR1_A__SHIFT 24
-
-#define NV30_3D_RC_FINAL0 0x000008f4
-#define NV30_3D_RC_FINAL0_D_INPUT__MASK 0x0000000f
-#define NV30_3D_RC_FINAL0_D_INPUT__SHIFT 0
-#define NV30_3D_RC_FINAL0_D_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL0_D_INPUT_CONSTANT_COLOR0 0x00000001
-#define NV30_3D_RC_FINAL0_D_INPUT_CONSTANT_COLOR1 0x00000002
-#define NV30_3D_RC_FINAL0_D_INPUT_FOG 0x00000003
-#define NV30_3D_RC_FINAL0_D_INPUT_PRIMARY_COLOR 0x00000004
-#define NV30_3D_RC_FINAL0_D_INPUT_SECONDARY_COLOR 0x00000005
-#define NV30_3D_RC_FINAL0_D_INPUT_TEXTURE0 0x00000008
-#define NV30_3D_RC_FINAL0_D_INPUT_TEXTURE1 0x00000009
-#define NV30_3D_RC_FINAL0_D_INPUT_TEXTURE2 0x0000000a
-#define NV30_3D_RC_FINAL0_D_INPUT_TEXTURE3 0x0000000b
-#define NV30_3D_RC_FINAL0_D_INPUT_SPARE0 0x0000000c
-#define NV30_3D_RC_FINAL0_D_INPUT_SPARE1 0x0000000d
-#define NV30_3D_RC_FINAL0_D_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0000000e
-#define NV30_3D_RC_FINAL0_D_INPUT_E_TIMES_F 0x0000000f
-#define NV30_3D_RC_FINAL0_D_COMPONENT_USAGE__MASK 0x00000010
-#define NV30_3D_RC_FINAL0_D_COMPONENT_USAGE__SHIFT 4
-#define NV30_3D_RC_FINAL0_D_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL0_D_COMPONENT_USAGE_ALPHA 0x00000010
-#define NV30_3D_RC_FINAL0_D_MAPPING__MASK 0x000000e0
-#define NV30_3D_RC_FINAL0_D_MAPPING__SHIFT 5
-#define NV30_3D_RC_FINAL0_D_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL0_D_MAPPING_UNSIGNED_INVERT 0x00000020
-#define NV30_3D_RC_FINAL0_D_MAPPING_EXPAND_NORMAL 0x00000040
-#define NV30_3D_RC_FINAL0_D_MAPPING_EXPAND_NEGATE 0x00000060
-#define NV30_3D_RC_FINAL0_D_MAPPING_HALF_BIAS_NORMAL 0x00000080
-#define NV30_3D_RC_FINAL0_D_MAPPING_HALF_BIAS_NEGATE 0x000000a0
-#define NV30_3D_RC_FINAL0_D_MAPPING_SIGNED_IDENTITY 0x000000c0
-#define NV30_3D_RC_FINAL0_D_MAPPING_SIGNED_NEGATE 0x000000e0
-#define NV30_3D_RC_FINAL0_C_INPUT__MASK 0x00000f00
-#define NV30_3D_RC_FINAL0_C_INPUT__SHIFT 8
-#define NV30_3D_RC_FINAL0_C_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL0_C_INPUT_CONSTANT_COLOR0 0x00000100
-#define NV30_3D_RC_FINAL0_C_INPUT_CONSTANT_COLOR1 0x00000200
-#define NV30_3D_RC_FINAL0_C_INPUT_FOG 0x00000300
-#define NV30_3D_RC_FINAL0_C_INPUT_PRIMARY_COLOR 0x00000400
-#define NV30_3D_RC_FINAL0_C_INPUT_SECONDARY_COLOR 0x00000500
-#define NV30_3D_RC_FINAL0_C_INPUT_TEXTURE0 0x00000800
-#define NV30_3D_RC_FINAL0_C_INPUT_TEXTURE1 0x00000900
-#define NV30_3D_RC_FINAL0_C_INPUT_TEXTURE2 0x00000a00
-#define NV30_3D_RC_FINAL0_C_INPUT_TEXTURE3 0x00000b00
-#define NV30_3D_RC_FINAL0_C_INPUT_SPARE0 0x00000c00
-#define NV30_3D_RC_FINAL0_C_INPUT_SPARE1 0x00000d00
-#define NV30_3D_RC_FINAL0_C_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x00000e00
-#define NV30_3D_RC_FINAL0_C_INPUT_E_TIMES_F 0x00000f00
-#define NV30_3D_RC_FINAL0_C_COMPONENT_USAGE__MASK 0x00001000
-#define NV30_3D_RC_FINAL0_C_COMPONENT_USAGE__SHIFT 12
-#define NV30_3D_RC_FINAL0_C_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL0_C_COMPONENT_USAGE_ALPHA 0x00001000
-#define NV30_3D_RC_FINAL0_C_MAPPING__MASK 0x0000e000
-#define NV30_3D_RC_FINAL0_C_MAPPING__SHIFT 13
-#define NV30_3D_RC_FINAL0_C_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL0_C_MAPPING_UNSIGNED_INVERT 0x00002000
-#define NV30_3D_RC_FINAL0_C_MAPPING_EXPAND_NORMAL 0x00004000
-#define NV30_3D_RC_FINAL0_C_MAPPING_EXPAND_NEGATE 0x00006000
-#define NV30_3D_RC_FINAL0_C_MAPPING_HALF_BIAS_NORMAL 0x00008000
-#define NV30_3D_RC_FINAL0_C_MAPPING_HALF_BIAS_NEGATE 0x0000a000
-#define NV30_3D_RC_FINAL0_C_MAPPING_SIGNED_IDENTITY 0x0000c000
-#define NV30_3D_RC_FINAL0_C_MAPPING_SIGNED_NEGATE 0x0000e000
-#define NV30_3D_RC_FINAL0_B_INPUT__MASK 0x000f0000
-#define NV30_3D_RC_FINAL0_B_INPUT__SHIFT 16
-#define NV30_3D_RC_FINAL0_B_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL0_B_INPUT_CONSTANT_COLOR0 0x00010000
-#define NV30_3D_RC_FINAL0_B_INPUT_CONSTANT_COLOR1 0x00020000
-#define NV30_3D_RC_FINAL0_B_INPUT_FOG 0x00030000
-#define NV30_3D_RC_FINAL0_B_INPUT_PRIMARY_COLOR 0x00040000
-#define NV30_3D_RC_FINAL0_B_INPUT_SECONDARY_COLOR 0x00050000
-#define NV30_3D_RC_FINAL0_B_INPUT_TEXTURE0 0x00080000
-#define NV30_3D_RC_FINAL0_B_INPUT_TEXTURE1 0x00090000
-#define NV30_3D_RC_FINAL0_B_INPUT_TEXTURE2 0x000a0000
-#define NV30_3D_RC_FINAL0_B_INPUT_TEXTURE3 0x000b0000
-#define NV30_3D_RC_FINAL0_B_INPUT_SPARE0 0x000c0000
-#define NV30_3D_RC_FINAL0_B_INPUT_SPARE1 0x000d0000
-#define NV30_3D_RC_FINAL0_B_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x000e0000
-#define NV30_3D_RC_FINAL0_B_INPUT_E_TIMES_F 0x000f0000
-#define NV30_3D_RC_FINAL0_B_COMPONENT_USAGE__MASK 0x00100000
-#define NV30_3D_RC_FINAL0_B_COMPONENT_USAGE__SHIFT 20
-#define NV30_3D_RC_FINAL0_B_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL0_B_COMPONENT_USAGE_ALPHA 0x00100000
-#define NV30_3D_RC_FINAL0_B_MAPPING__MASK 0x00e00000
-#define NV30_3D_RC_FINAL0_B_MAPPING__SHIFT 21
-#define NV30_3D_RC_FINAL0_B_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL0_B_MAPPING_UNSIGNED_INVERT 0x00200000
-#define NV30_3D_RC_FINAL0_B_MAPPING_EXPAND_NORMAL 0x00400000
-#define NV30_3D_RC_FINAL0_B_MAPPING_EXPAND_NEGATE 0x00600000
-#define NV30_3D_RC_FINAL0_B_MAPPING_HALF_BIAS_NORMAL 0x00800000
-#define NV30_3D_RC_FINAL0_B_MAPPING_HALF_BIAS_NEGATE 0x00a00000
-#define NV30_3D_RC_FINAL0_B_MAPPING_SIGNED_IDENTITY 0x00c00000
-#define NV30_3D_RC_FINAL0_B_MAPPING_SIGNED_NEGATE 0x00e00000
-#define NV30_3D_RC_FINAL0_A_INPUT__MASK 0x0f000000
-#define NV30_3D_RC_FINAL0_A_INPUT__SHIFT 24
-#define NV30_3D_RC_FINAL0_A_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL0_A_INPUT_CONSTANT_COLOR0 0x01000000
-#define NV30_3D_RC_FINAL0_A_INPUT_CONSTANT_COLOR1 0x02000000
-#define NV30_3D_RC_FINAL0_A_INPUT_FOG 0x03000000
-#define NV30_3D_RC_FINAL0_A_INPUT_PRIMARY_COLOR 0x04000000
-#define NV30_3D_RC_FINAL0_A_INPUT_SECONDARY_COLOR 0x05000000
-#define NV30_3D_RC_FINAL0_A_INPUT_TEXTURE0 0x08000000
-#define NV30_3D_RC_FINAL0_A_INPUT_TEXTURE1 0x09000000
-#define NV30_3D_RC_FINAL0_A_INPUT_TEXTURE2 0x0a000000
-#define NV30_3D_RC_FINAL0_A_INPUT_TEXTURE3 0x0b000000
-#define NV30_3D_RC_FINAL0_A_INPUT_SPARE0 0x0c000000
-#define NV30_3D_RC_FINAL0_A_INPUT_SPARE1 0x0d000000
-#define NV30_3D_RC_FINAL0_A_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0e000000
-#define NV30_3D_RC_FINAL0_A_INPUT_E_TIMES_F 0x0f000000
-#define NV30_3D_RC_FINAL0_A_COMPONENT_USAGE__MASK 0x10000000
-#define NV30_3D_RC_FINAL0_A_COMPONENT_USAGE__SHIFT 28
-#define NV30_3D_RC_FINAL0_A_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL0_A_COMPONENT_USAGE_ALPHA 0x10000000
-#define NV30_3D_RC_FINAL0_A_MAPPING__MASK 0xe0000000
-#define NV30_3D_RC_FINAL0_A_MAPPING__SHIFT 29
-#define NV30_3D_RC_FINAL0_A_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_UNSIGNED_INVERT 0x20000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_EXPAND_NORMAL 0x40000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_EXPAND_NEGATE 0x60000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_HALF_BIAS_NORMAL 0x80000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_HALF_BIAS_NEGATE 0xa0000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_SIGNED_IDENTITY 0xc0000000
-#define NV30_3D_RC_FINAL0_A_MAPPING_SIGNED_NEGATE 0xe0000000
-
-#define NV30_3D_RC_FINAL1 0x000008f8
-#define NV30_3D_RC_FINAL1_COLOR_SUM_CLAMP 0x00000080
-#define NV30_3D_RC_FINAL1_G_INPUT__MASK 0x00000f00
-#define NV30_3D_RC_FINAL1_G_INPUT__SHIFT 8
-#define NV30_3D_RC_FINAL1_G_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL1_G_INPUT_CONSTANT_COLOR0 0x00000100
-#define NV30_3D_RC_FINAL1_G_INPUT_CONSTANT_COLOR1 0x00000200
-#define NV30_3D_RC_FINAL1_G_INPUT_FOG 0x00000300
-#define NV30_3D_RC_FINAL1_G_INPUT_PRIMARY_COLOR 0x00000400
-#define NV30_3D_RC_FINAL1_G_INPUT_SECONDARY_COLOR 0x00000500
-#define NV30_3D_RC_FINAL1_G_INPUT_TEXTURE0 0x00000800
-#define NV30_3D_RC_FINAL1_G_INPUT_TEXTURE1 0x00000900
-#define NV30_3D_RC_FINAL1_G_INPUT_TEXTURE2 0x00000a00
-#define NV30_3D_RC_FINAL1_G_INPUT_TEXTURE3 0x00000b00
-#define NV30_3D_RC_FINAL1_G_INPUT_SPARE0 0x00000c00
-#define NV30_3D_RC_FINAL1_G_INPUT_SPARE1 0x00000d00
-#define NV30_3D_RC_FINAL1_G_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x00000e00
-#define NV30_3D_RC_FINAL1_G_INPUT_E_TIMES_F 0x00000f00
-#define NV30_3D_RC_FINAL1_G_COMPONENT_USAGE__MASK 0x00001000
-#define NV30_3D_RC_FINAL1_G_COMPONENT_USAGE__SHIFT 12
-#define NV30_3D_RC_FINAL1_G_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL1_G_COMPONENT_USAGE_ALPHA 0x00001000
-#define NV30_3D_RC_FINAL1_G_MAPPING__MASK 0x0000e000
-#define NV30_3D_RC_FINAL1_G_MAPPING__SHIFT 13
-#define NV30_3D_RC_FINAL1_G_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL1_G_MAPPING_UNSIGNED_INVERT 0x00002000
-#define NV30_3D_RC_FINAL1_G_MAPPING_EXPAND_NORMAL 0x00004000
-#define NV30_3D_RC_FINAL1_G_MAPPING_EXPAND_NEGATE 0x00006000
-#define NV30_3D_RC_FINAL1_G_MAPPING_HALF_BIAS_NORMAL 0x00008000
-#define NV30_3D_RC_FINAL1_G_MAPPING_HALF_BIAS_NEGATE 0x0000a000
-#define NV30_3D_RC_FINAL1_G_MAPPING_SIGNED_IDENTITY 0x0000c000
-#define NV30_3D_RC_FINAL1_G_MAPPING_SIGNED_NEGATE 0x0000e000
-#define NV30_3D_RC_FINAL1_F_INPUT__MASK 0x000f0000
-#define NV30_3D_RC_FINAL1_F_INPUT__SHIFT 16
-#define NV30_3D_RC_FINAL1_F_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL1_F_INPUT_CONSTANT_COLOR0 0x00010000
-#define NV30_3D_RC_FINAL1_F_INPUT_CONSTANT_COLOR1 0x00020000
-#define NV30_3D_RC_FINAL1_F_INPUT_FOG 0x00030000
-#define NV30_3D_RC_FINAL1_F_INPUT_PRIMARY_COLOR 0x00040000
-#define NV30_3D_RC_FINAL1_F_INPUT_SECONDARY_COLOR 0x00050000
-#define NV30_3D_RC_FINAL1_F_INPUT_TEXTURE0 0x00080000
-#define NV30_3D_RC_FINAL1_F_INPUT_TEXTURE1 0x00090000
-#define NV30_3D_RC_FINAL1_F_INPUT_TEXTURE2 0x000a0000
-#define NV30_3D_RC_FINAL1_F_INPUT_TEXTURE3 0x000b0000
-#define NV30_3D_RC_FINAL1_F_INPUT_SPARE0 0x000c0000
-#define NV30_3D_RC_FINAL1_F_INPUT_SPARE1 0x000d0000
-#define NV30_3D_RC_FINAL1_F_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x000e0000
-#define NV30_3D_RC_FINAL1_F_INPUT_E_TIMES_F 0x000f0000
-#define NV30_3D_RC_FINAL1_F_COMPONENT_USAGE__MASK 0x00100000
-#define NV30_3D_RC_FINAL1_F_COMPONENT_USAGE__SHIFT 20
-#define NV30_3D_RC_FINAL1_F_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL1_F_COMPONENT_USAGE_ALPHA 0x00100000
-#define NV30_3D_RC_FINAL1_F_MAPPING__MASK 0x00e00000
-#define NV30_3D_RC_FINAL1_F_MAPPING__SHIFT 21
-#define NV30_3D_RC_FINAL1_F_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL1_F_MAPPING_UNSIGNED_INVERT 0x00200000
-#define NV30_3D_RC_FINAL1_F_MAPPING_EXPAND_NORMAL 0x00400000
-#define NV30_3D_RC_FINAL1_F_MAPPING_EXPAND_NEGATE 0x00600000
-#define NV30_3D_RC_FINAL1_F_MAPPING_HALF_BIAS_NORMAL 0x00800000
-#define NV30_3D_RC_FINAL1_F_MAPPING_HALF_BIAS_NEGATE 0x00a00000
-#define NV30_3D_RC_FINAL1_F_MAPPING_SIGNED_IDENTITY 0x00c00000
-#define NV30_3D_RC_FINAL1_F_MAPPING_SIGNED_NEGATE 0x00e00000
-#define NV30_3D_RC_FINAL1_E_INPUT__MASK 0x0f000000
-#define NV30_3D_RC_FINAL1_E_INPUT__SHIFT 24
-#define NV30_3D_RC_FINAL1_E_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_FINAL1_E_INPUT_CONSTANT_COLOR0 0x01000000
-#define NV30_3D_RC_FINAL1_E_INPUT_CONSTANT_COLOR1 0x02000000
-#define NV30_3D_RC_FINAL1_E_INPUT_FOG 0x03000000
-#define NV30_3D_RC_FINAL1_E_INPUT_PRIMARY_COLOR 0x04000000
-#define NV30_3D_RC_FINAL1_E_INPUT_SECONDARY_COLOR 0x05000000
-#define NV30_3D_RC_FINAL1_E_INPUT_TEXTURE0 0x08000000
-#define NV30_3D_RC_FINAL1_E_INPUT_TEXTURE1 0x09000000
-#define NV30_3D_RC_FINAL1_E_INPUT_TEXTURE2 0x0a000000
-#define NV30_3D_RC_FINAL1_E_INPUT_TEXTURE3 0x0b000000
-#define NV30_3D_RC_FINAL1_E_INPUT_SPARE0 0x0c000000
-#define NV30_3D_RC_FINAL1_E_INPUT_SPARE1 0x0d000000
-#define NV30_3D_RC_FINAL1_E_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0e000000
-#define NV30_3D_RC_FINAL1_E_INPUT_E_TIMES_F 0x0f000000
-#define NV30_3D_RC_FINAL1_E_COMPONENT_USAGE__MASK 0x10000000
-#define NV30_3D_RC_FINAL1_E_COMPONENT_USAGE__SHIFT 28
-#define NV30_3D_RC_FINAL1_E_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_FINAL1_E_COMPONENT_USAGE_ALPHA 0x10000000
-#define NV30_3D_RC_FINAL1_E_MAPPING__MASK 0xe0000000
-#define NV30_3D_RC_FINAL1_E_MAPPING__SHIFT 29
-#define NV30_3D_RC_FINAL1_E_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_UNSIGNED_INVERT 0x20000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_EXPAND_NORMAL 0x40000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_EXPAND_NEGATE 0x60000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_HALF_BIAS_NORMAL 0x80000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_HALF_BIAS_NEGATE 0xa0000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_SIGNED_IDENTITY 0xc0000000
-#define NV30_3D_RC_FINAL1_E_MAPPING_SIGNED_NEGATE 0xe0000000
-
-#define NV30_3D_RC_ENABLE 0x000008fc
-#define NV30_3D_RC_ENABLE_NUM_COMBINERS__MASK 0x0000000f
-#define NV30_3D_RC_ENABLE_NUM_COMBINERS__SHIFT 0
-#define NV30_3D_RC_ENABLE_STAGE_CONSTANT_COLOR0 0x0000f000
-#define NV30_3D_RC_ENABLE_STAGE_CONSTANT_COLOR1 0x000f0000
-
-
-#define NV30_3D_RC_IN_ALPHA(i0) (0x00000900 + 0x20*(i0))
-#define NV30_3D_RC_IN_ALPHA_D_INPUT__MASK 0x0000000f
-#define NV30_3D_RC_IN_ALPHA_D_INPUT__SHIFT 0
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_CONSTANT_COLOR0 0x00000001
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_CONSTANT_COLOR1 0x00000002
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_FOG 0x00000003
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_PRIMARY_COLOR 0x00000004
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_SECONDARY_COLOR 0x00000005
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_TEXTURE0 0x00000008
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_TEXTURE1 0x00000009
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_TEXTURE2 0x0000000a
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_TEXTURE3 0x0000000b
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_SPARE0 0x0000000c
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_SPARE1 0x0000000d
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0000000e
-#define NV30_3D_RC_IN_ALPHA_D_INPUT_E_TIMES_F 0x0000000f
-#define NV30_3D_RC_IN_ALPHA_D_COMPONENT_USAGE__MASK 0x00000010
-#define NV30_3D_RC_IN_ALPHA_D_COMPONENT_USAGE__SHIFT 4
-#define NV30_3D_RC_IN_ALPHA_D_COMPONENT_USAGE_BLUE 0x00000000
-#define NV30_3D_RC_IN_ALPHA_D_COMPONENT_USAGE_ALPHA 0x00000010
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING__MASK 0x000000e0
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING__SHIFT 5
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_UNSIGNED_INVERT 0x00000020
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_EXPAND_NORMAL 0x00000040
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_EXPAND_NEGATE 0x00000060
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_HALF_BIAS_NORMAL 0x00000080
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_HALF_BIAS_NEGATE 0x000000a0
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_SIGNED_IDENTITY 0x000000c0
-#define NV30_3D_RC_IN_ALPHA_D_MAPPING_SIGNED_NEGATE 0x000000e0
-#define NV30_3D_RC_IN_ALPHA_C_INPUT__MASK 0x00000f00
-#define NV30_3D_RC_IN_ALPHA_C_INPUT__SHIFT 8
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_CONSTANT_COLOR0 0x00000100
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_CONSTANT_COLOR1 0x00000200
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_FOG 0x00000300
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_PRIMARY_COLOR 0x00000400
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_SECONDARY_COLOR 0x00000500
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_TEXTURE0 0x00000800
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_TEXTURE1 0x00000900
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_TEXTURE2 0x00000a00
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_TEXTURE3 0x00000b00
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_SPARE0 0x00000c00
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_SPARE1 0x00000d00
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x00000e00
-#define NV30_3D_RC_IN_ALPHA_C_INPUT_E_TIMES_F 0x00000f00
-#define NV30_3D_RC_IN_ALPHA_C_COMPONENT_USAGE__MASK 0x00001000
-#define NV30_3D_RC_IN_ALPHA_C_COMPONENT_USAGE__SHIFT 12
-#define NV30_3D_RC_IN_ALPHA_C_COMPONENT_USAGE_BLUE 0x00000000
-#define NV30_3D_RC_IN_ALPHA_C_COMPONENT_USAGE_ALPHA 0x00001000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING__MASK 0x0000e000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING__SHIFT 13
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_UNSIGNED_INVERT 0x00002000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_EXPAND_NORMAL 0x00004000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_EXPAND_NEGATE 0x00006000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_HALF_BIAS_NORMAL 0x00008000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_HALF_BIAS_NEGATE 0x0000a000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_SIGNED_IDENTITY 0x0000c000
-#define NV30_3D_RC_IN_ALPHA_C_MAPPING_SIGNED_NEGATE 0x0000e000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT__MASK 0x000f0000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT__SHIFT 16
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_CONSTANT_COLOR0 0x00010000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_CONSTANT_COLOR1 0x00020000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_FOG 0x00030000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_PRIMARY_COLOR 0x00040000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_SECONDARY_COLOR 0x00050000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_TEXTURE0 0x00080000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_TEXTURE1 0x00090000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_TEXTURE2 0x000a0000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_TEXTURE3 0x000b0000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_SPARE0 0x000c0000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_SPARE1 0x000d0000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x000e0000
-#define NV30_3D_RC_IN_ALPHA_B_INPUT_E_TIMES_F 0x000f0000
-#define NV30_3D_RC_IN_ALPHA_B_COMPONENT_USAGE__MASK 0x00100000
-#define NV30_3D_RC_IN_ALPHA_B_COMPONENT_USAGE__SHIFT 20
-#define NV30_3D_RC_IN_ALPHA_B_COMPONENT_USAGE_BLUE 0x00000000
-#define NV30_3D_RC_IN_ALPHA_B_COMPONENT_USAGE_ALPHA 0x00100000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING__MASK 0x00e00000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING__SHIFT 21
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_UNSIGNED_INVERT 0x00200000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_EXPAND_NORMAL 0x00400000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_EXPAND_NEGATE 0x00600000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_HALF_BIAS_NORMAL 0x00800000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_HALF_BIAS_NEGATE 0x00a00000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_SIGNED_IDENTITY 0x00c00000
-#define NV30_3D_RC_IN_ALPHA_B_MAPPING_SIGNED_NEGATE 0x00e00000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT__MASK 0x0f000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT__SHIFT 24
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_CONSTANT_COLOR0 0x01000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_CONSTANT_COLOR1 0x02000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_FOG 0x03000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_PRIMARY_COLOR 0x04000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_SECONDARY_COLOR 0x05000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_TEXTURE0 0x08000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_TEXTURE1 0x09000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_TEXTURE2 0x0a000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_TEXTURE3 0x0b000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_SPARE0 0x0c000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_SPARE1 0x0d000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0e000000
-#define NV30_3D_RC_IN_ALPHA_A_INPUT_E_TIMES_F 0x0f000000
-#define NV30_3D_RC_IN_ALPHA_A_COMPONENT_USAGE__MASK 0x10000000
-#define NV30_3D_RC_IN_ALPHA_A_COMPONENT_USAGE__SHIFT 28
-#define NV30_3D_RC_IN_ALPHA_A_COMPONENT_USAGE_BLUE 0x00000000
-#define NV30_3D_RC_IN_ALPHA_A_COMPONENT_USAGE_ALPHA 0x10000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING__MASK 0xe0000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING__SHIFT 29
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_UNSIGNED_INVERT 0x20000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_EXPAND_NORMAL 0x40000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_EXPAND_NEGATE 0x60000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_HALF_BIAS_NORMAL 0x80000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_HALF_BIAS_NEGATE 0xa0000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_SIGNED_IDENTITY 0xc0000000
-#define NV30_3D_RC_IN_ALPHA_A_MAPPING_SIGNED_NEGATE 0xe0000000
-
-#define NV30_3D_RC_IN_RGB(i0) (0x00000904 + 0x20*(i0))
-#define NV30_3D_RC_IN_RGB_D_INPUT__MASK 0x0000000f
-#define NV30_3D_RC_IN_RGB_D_INPUT__SHIFT 0
-#define NV30_3D_RC_IN_RGB_D_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_RGB_D_INPUT_CONSTANT_COLOR0 0x00000001
-#define NV30_3D_RC_IN_RGB_D_INPUT_CONSTANT_COLOR1 0x00000002
-#define NV30_3D_RC_IN_RGB_D_INPUT_FOG 0x00000003
-#define NV30_3D_RC_IN_RGB_D_INPUT_PRIMARY_COLOR 0x00000004
-#define NV30_3D_RC_IN_RGB_D_INPUT_SECONDARY_COLOR 0x00000005
-#define NV30_3D_RC_IN_RGB_D_INPUT_TEXTURE0 0x00000008
-#define NV30_3D_RC_IN_RGB_D_INPUT_TEXTURE1 0x00000009
-#define NV30_3D_RC_IN_RGB_D_INPUT_TEXTURE2 0x0000000a
-#define NV30_3D_RC_IN_RGB_D_INPUT_TEXTURE3 0x0000000b
-#define NV30_3D_RC_IN_RGB_D_INPUT_SPARE0 0x0000000c
-#define NV30_3D_RC_IN_RGB_D_INPUT_SPARE1 0x0000000d
-#define NV30_3D_RC_IN_RGB_D_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0000000e
-#define NV30_3D_RC_IN_RGB_D_INPUT_E_TIMES_F 0x0000000f
-#define NV30_3D_RC_IN_RGB_D_COMPONENT_USAGE__MASK 0x00000010
-#define NV30_3D_RC_IN_RGB_D_COMPONENT_USAGE__SHIFT 4
-#define NV30_3D_RC_IN_RGB_D_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_IN_RGB_D_COMPONENT_USAGE_ALPHA 0x00000010
-#define NV30_3D_RC_IN_RGB_D_MAPPING__MASK 0x000000e0
-#define NV30_3D_RC_IN_RGB_D_MAPPING__SHIFT 5
-#define NV30_3D_RC_IN_RGB_D_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_RGB_D_MAPPING_UNSIGNED_INVERT 0x00000020
-#define NV30_3D_RC_IN_RGB_D_MAPPING_EXPAND_NORMAL 0x00000040
-#define NV30_3D_RC_IN_RGB_D_MAPPING_EXPAND_NEGATE 0x00000060
-#define NV30_3D_RC_IN_RGB_D_MAPPING_HALF_BIAS_NORMAL 0x00000080
-#define NV30_3D_RC_IN_RGB_D_MAPPING_HALF_BIAS_NEGATE 0x000000a0
-#define NV30_3D_RC_IN_RGB_D_MAPPING_SIGNED_IDENTITY 0x000000c0
-#define NV30_3D_RC_IN_RGB_D_MAPPING_SIGNED_NEGATE 0x000000e0
-#define NV30_3D_RC_IN_RGB_C_INPUT__MASK 0x00000f00
-#define NV30_3D_RC_IN_RGB_C_INPUT__SHIFT 8
-#define NV30_3D_RC_IN_RGB_C_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_RGB_C_INPUT_CONSTANT_COLOR0 0x00000100
-#define NV30_3D_RC_IN_RGB_C_INPUT_CONSTANT_COLOR1 0x00000200
-#define NV30_3D_RC_IN_RGB_C_INPUT_FOG 0x00000300
-#define NV30_3D_RC_IN_RGB_C_INPUT_PRIMARY_COLOR 0x00000400
-#define NV30_3D_RC_IN_RGB_C_INPUT_SECONDARY_COLOR 0x00000500
-#define NV30_3D_RC_IN_RGB_C_INPUT_TEXTURE0 0x00000800
-#define NV30_3D_RC_IN_RGB_C_INPUT_TEXTURE1 0x00000900
-#define NV30_3D_RC_IN_RGB_C_INPUT_TEXTURE2 0x00000a00
-#define NV30_3D_RC_IN_RGB_C_INPUT_TEXTURE3 0x00000b00
-#define NV30_3D_RC_IN_RGB_C_INPUT_SPARE0 0x00000c00
-#define NV30_3D_RC_IN_RGB_C_INPUT_SPARE1 0x00000d00
-#define NV30_3D_RC_IN_RGB_C_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x00000e00
-#define NV30_3D_RC_IN_RGB_C_INPUT_E_TIMES_F 0x00000f00
-#define NV30_3D_RC_IN_RGB_C_COMPONENT_USAGE__MASK 0x00001000
-#define NV30_3D_RC_IN_RGB_C_COMPONENT_USAGE__SHIFT 12
-#define NV30_3D_RC_IN_RGB_C_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_IN_RGB_C_COMPONENT_USAGE_ALPHA 0x00001000
-#define NV30_3D_RC_IN_RGB_C_MAPPING__MASK 0x0000e000
-#define NV30_3D_RC_IN_RGB_C_MAPPING__SHIFT 13
-#define NV30_3D_RC_IN_RGB_C_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_UNSIGNED_INVERT 0x00002000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_EXPAND_NORMAL 0x00004000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_EXPAND_NEGATE 0x00006000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_HALF_BIAS_NORMAL 0x00008000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_HALF_BIAS_NEGATE 0x0000a000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_SIGNED_IDENTITY 0x0000c000
-#define NV30_3D_RC_IN_RGB_C_MAPPING_SIGNED_NEGATE 0x0000e000
-#define NV30_3D_RC_IN_RGB_B_INPUT__MASK 0x000f0000
-#define NV30_3D_RC_IN_RGB_B_INPUT__SHIFT 16
-#define NV30_3D_RC_IN_RGB_B_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_RGB_B_INPUT_CONSTANT_COLOR0 0x00010000
-#define NV30_3D_RC_IN_RGB_B_INPUT_CONSTANT_COLOR1 0x00020000
-#define NV30_3D_RC_IN_RGB_B_INPUT_FOG 0x00030000
-#define NV30_3D_RC_IN_RGB_B_INPUT_PRIMARY_COLOR 0x00040000
-#define NV30_3D_RC_IN_RGB_B_INPUT_SECONDARY_COLOR 0x00050000
-#define NV30_3D_RC_IN_RGB_B_INPUT_TEXTURE0 0x00080000
-#define NV30_3D_RC_IN_RGB_B_INPUT_TEXTURE1 0x00090000
-#define NV30_3D_RC_IN_RGB_B_INPUT_TEXTURE2 0x000a0000
-#define NV30_3D_RC_IN_RGB_B_INPUT_TEXTURE3 0x000b0000
-#define NV30_3D_RC_IN_RGB_B_INPUT_SPARE0 0x000c0000
-#define NV30_3D_RC_IN_RGB_B_INPUT_SPARE1 0x000d0000
-#define NV30_3D_RC_IN_RGB_B_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x000e0000
-#define NV30_3D_RC_IN_RGB_B_INPUT_E_TIMES_F 0x000f0000
-#define NV30_3D_RC_IN_RGB_B_COMPONENT_USAGE__MASK 0x00100000
-#define NV30_3D_RC_IN_RGB_B_COMPONENT_USAGE__SHIFT 20
-#define NV30_3D_RC_IN_RGB_B_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_IN_RGB_B_COMPONENT_USAGE_ALPHA 0x00100000
-#define NV30_3D_RC_IN_RGB_B_MAPPING__MASK 0x00e00000
-#define NV30_3D_RC_IN_RGB_B_MAPPING__SHIFT 21
-#define NV30_3D_RC_IN_RGB_B_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_UNSIGNED_INVERT 0x00200000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_EXPAND_NORMAL 0x00400000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_EXPAND_NEGATE 0x00600000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_HALF_BIAS_NORMAL 0x00800000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_HALF_BIAS_NEGATE 0x00a00000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_SIGNED_IDENTITY 0x00c00000
-#define NV30_3D_RC_IN_RGB_B_MAPPING_SIGNED_NEGATE 0x00e00000
-#define NV30_3D_RC_IN_RGB_A_INPUT__MASK 0x0f000000
-#define NV30_3D_RC_IN_RGB_A_INPUT__SHIFT 24
-#define NV30_3D_RC_IN_RGB_A_INPUT_ZERO 0x00000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_CONSTANT_COLOR0 0x01000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_CONSTANT_COLOR1 0x02000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_FOG 0x03000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_PRIMARY_COLOR 0x04000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_SECONDARY_COLOR 0x05000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_TEXTURE0 0x08000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_TEXTURE1 0x09000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_TEXTURE2 0x0a000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_TEXTURE3 0x0b000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_SPARE0 0x0c000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_SPARE1 0x0d000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0e000000
-#define NV30_3D_RC_IN_RGB_A_INPUT_E_TIMES_F 0x0f000000
-#define NV30_3D_RC_IN_RGB_A_COMPONENT_USAGE__MASK 0x10000000
-#define NV30_3D_RC_IN_RGB_A_COMPONENT_USAGE__SHIFT 28
-#define NV30_3D_RC_IN_RGB_A_COMPONENT_USAGE_RGB 0x00000000
-#define NV30_3D_RC_IN_RGB_A_COMPONENT_USAGE_ALPHA 0x10000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING__MASK 0xe0000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING__SHIFT 29
-#define NV30_3D_RC_IN_RGB_A_MAPPING_UNSIGNED_IDENTITY 0x00000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_UNSIGNED_INVERT 0x20000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_EXPAND_NORMAL 0x40000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_EXPAND_NEGATE 0x60000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_HALF_BIAS_NORMAL 0x80000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_HALF_BIAS_NEGATE 0xa0000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_SIGNED_IDENTITY 0xc0000000
-#define NV30_3D_RC_IN_RGB_A_MAPPING_SIGNED_NEGATE 0xe0000000
-
-#define NV30_3D_RC_CONSTANT_COLOR0(i0) (0x00000908 + 0x20*(i0))
-#define NV30_3D_RC_CONSTANT_COLOR0_B__MASK 0x000000ff
-#define NV30_3D_RC_CONSTANT_COLOR0_B__SHIFT 0
-#define NV30_3D_RC_CONSTANT_COLOR0_G__MASK 0x0000ff00
-#define NV30_3D_RC_CONSTANT_COLOR0_G__SHIFT 8
-#define NV30_3D_RC_CONSTANT_COLOR0_R__MASK 0x00ff0000
-#define NV30_3D_RC_CONSTANT_COLOR0_R__SHIFT 16
-#define NV30_3D_RC_CONSTANT_COLOR0_A__MASK 0xff000000
-#define NV30_3D_RC_CONSTANT_COLOR0_A__SHIFT 24
-
-#define NV30_3D_RC_CONSTANT_COLOR1(i0) (0x0000090c + 0x20*(i0))
-#define NV30_3D_RC_CONSTANT_COLOR1_B__MASK 0x000000ff
-#define NV30_3D_RC_CONSTANT_COLOR1_B__SHIFT 0
-#define NV30_3D_RC_CONSTANT_COLOR1_G__MASK 0x0000ff00
-#define NV30_3D_RC_CONSTANT_COLOR1_G__SHIFT 8
-#define NV30_3D_RC_CONSTANT_COLOR1_R__MASK 0x00ff0000
-#define NV30_3D_RC_CONSTANT_COLOR1_R__SHIFT 16
-#define NV30_3D_RC_CONSTANT_COLOR1_A__MASK 0xff000000
-#define NV30_3D_RC_CONSTANT_COLOR1_A__SHIFT 24
-
-#define NV30_3D_RC_OUT_ALPHA(i0) (0x00000910 + 0x20*(i0))
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT__MASK 0x0000000f
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT__SHIFT 0
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_ZERO 0x00000000
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_CONSTANT_COLOR0 0x00000001
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_CONSTANT_COLOR1 0x00000002
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_FOG 0x00000003
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_PRIMARY_COLOR 0x00000004
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_SECONDARY_COLOR 0x00000005
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_TEXTURE0 0x00000008
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_TEXTURE1 0x00000009
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_TEXTURE2 0x0000000a
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_TEXTURE3 0x0000000b
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_SPARE0 0x0000000c
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_SPARE1 0x0000000d
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0000000e
-#define NV30_3D_RC_OUT_ALPHA_CD_OUTPUT_E_TIMES_F 0x0000000f
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT__MASK 0x000000f0
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT__SHIFT 4
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_ZERO 0x00000000
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_CONSTANT_COLOR0 0x00000010
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_CONSTANT_COLOR1 0x00000020
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_FOG 0x00000030
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_PRIMARY_COLOR 0x00000040
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_SECONDARY_COLOR 0x00000050
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_TEXTURE0 0x00000080
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_TEXTURE1 0x00000090
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_TEXTURE2 0x000000a0
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_TEXTURE3 0x000000b0
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_SPARE0 0x000000c0
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_SPARE1 0x000000d0
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_SPARE0_PLUS_SECONDARY_COLOR 0x000000e0
-#define NV30_3D_RC_OUT_ALPHA_AB_OUTPUT_E_TIMES_F 0x000000f0
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT__MASK 0x00000f00
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT__SHIFT 8
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_ZERO 0x00000000
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_CONSTANT_COLOR0 0x00000100
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_CONSTANT_COLOR1 0x00000200
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_FOG 0x00000300
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_PRIMARY_COLOR 0x00000400
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_SECONDARY_COLOR 0x00000500
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_TEXTURE0 0x00000800
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_TEXTURE1 0x00000900
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_TEXTURE2 0x00000a00
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_TEXTURE3 0x00000b00
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_SPARE0 0x00000c00
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_SPARE1 0x00000d00
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_SPARE0_PLUS_SECONDARY_COLOR 0x00000e00
-#define NV30_3D_RC_OUT_ALPHA_SUM_OUTPUT_E_TIMES_F 0x00000f00
-#define NV30_3D_RC_OUT_ALPHA_CD_DOT_PRODUCT 0x00001000
-#define NV30_3D_RC_OUT_ALPHA_AB_DOT_PRODUCT 0x00002000
-#define NV30_3D_RC_OUT_ALPHA_MUX_SUM 0x00004000
-#define NV30_3D_RC_OUT_ALPHA_BIAS__MASK 0x00008000
-#define NV30_3D_RC_OUT_ALPHA_BIAS__SHIFT 15
-#define NV30_3D_RC_OUT_ALPHA_BIAS_NONE 0x00000000
-#define NV30_3D_RC_OUT_ALPHA_BIAS_BIAS_BY_NEGATIVE_ONE_HALF 0x00008000
-#define NV30_3D_RC_OUT_ALPHA_SCALE__MASK 0x00030000
-#define NV30_3D_RC_OUT_ALPHA_SCALE__SHIFT 16
-#define NV30_3D_RC_OUT_ALPHA_SCALE_NONE 0x00000000
-#define NV30_3D_RC_OUT_ALPHA_SCALE_SCALE_BY_TWO 0x00010000
-#define NV30_3D_RC_OUT_ALPHA_SCALE_SCALE_BY_FOUR 0x00020000
-#define NV30_3D_RC_OUT_ALPHA_SCALE_SCALE_BY_ONE_HALF 0x00030000
-
-#define NV30_3D_RC_OUT_RGB(i0) (0x00000914 + 0x20*(i0))
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT__MASK 0x0000000f
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT__SHIFT 0
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_ZERO 0x00000000
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_CONSTANT_COLOR0 0x00000001
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_CONSTANT_COLOR1 0x00000002
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_FOG 0x00000003
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_PRIMARY_COLOR 0x00000004
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_SECONDARY_COLOR 0x00000005
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_TEXTURE0 0x00000008
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_TEXTURE1 0x00000009
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_TEXTURE2 0x0000000a
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_TEXTURE3 0x0000000b
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_SPARE0 0x0000000c
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_SPARE1 0x0000000d
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_SPARE0_PLUS_SECONDARY_COLOR 0x0000000e
-#define NV30_3D_RC_OUT_RGB_CD_OUTPUT_E_TIMES_F 0x0000000f
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT__MASK 0x000000f0
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT__SHIFT 4
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_ZERO 0x00000000
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_CONSTANT_COLOR0 0x00000010
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_CONSTANT_COLOR1 0x00000020
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_FOG 0x00000030
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_PRIMARY_COLOR 0x00000040
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_SECONDARY_COLOR 0x00000050
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_TEXTURE0 0x00000080
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_TEXTURE1 0x00000090
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_TEXTURE2 0x000000a0
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_TEXTURE3 0x000000b0
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_SPARE0 0x000000c0
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_SPARE1 0x000000d0
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_SPARE0_PLUS_SECONDARY_COLOR 0x000000e0
-#define NV30_3D_RC_OUT_RGB_AB_OUTPUT_E_TIMES_F 0x000000f0
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT__MASK 0x00000f00
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT__SHIFT 8
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_ZERO 0x00000000
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_CONSTANT_COLOR0 0x00000100
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_CONSTANT_COLOR1 0x00000200
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_FOG 0x00000300
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_PRIMARY_COLOR 0x00000400
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_SECONDARY_COLOR 0x00000500
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_TEXTURE0 0x00000800
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_TEXTURE1 0x00000900
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_TEXTURE2 0x00000a00
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_TEXTURE3 0x00000b00
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_SPARE0 0x00000c00
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_SPARE1 0x00000d00
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_SPARE0_PLUS_SECONDARY_COLOR 0x00000e00
-#define NV30_3D_RC_OUT_RGB_SUM_OUTPUT_E_TIMES_F 0x00000f00
-#define NV30_3D_RC_OUT_RGB_CD_DOT_PRODUCT 0x00001000
-#define NV30_3D_RC_OUT_RGB_AB_DOT_PRODUCT 0x00002000
-#define NV30_3D_RC_OUT_RGB_MUX_SUM 0x00004000
-#define NV30_3D_RC_OUT_RGB_BIAS__MASK 0x00008000
-#define NV30_3D_RC_OUT_RGB_BIAS__SHIFT 15
-#define NV30_3D_RC_OUT_RGB_BIAS_NONE 0x00000000
-#define NV30_3D_RC_OUT_RGB_BIAS_BIAS_BY_NEGATIVE_ONE_HALF 0x00008000
-#define NV30_3D_RC_OUT_RGB_SCALE__MASK 0x00030000
-#define NV30_3D_RC_OUT_RGB_SCALE__SHIFT 16
-#define NV30_3D_RC_OUT_RGB_SCALE_NONE 0x00000000
-#define NV30_3D_RC_OUT_RGB_SCALE_SCALE_BY_TWO 0x00010000
-#define NV30_3D_RC_OUT_RGB_SCALE_SCALE_BY_FOUR 0x00020000
-#define NV30_3D_RC_OUT_RGB_SCALE_SCALE_BY_ONE_HALF 0x00030000
-
-#define NV30_3D_VIEWPORT_HORIZ 0x00000a00
-#define NV30_3D_VIEWPORT_HORIZ_X__MASK 0x0000ffff
-#define NV30_3D_VIEWPORT_HORIZ_X__SHIFT 0
-#define NV30_3D_VIEWPORT_HORIZ_W__MASK 0xffff0000
-#define NV30_3D_VIEWPORT_HORIZ_W__SHIFT 16
-
-#define NV30_3D_VIEWPORT_VERT 0x00000a04
-#define NV30_3D_VIEWPORT_VERT_Y__MASK 0x0000ffff
-#define NV30_3D_VIEWPORT_VERT_Y__SHIFT 0
-#define NV30_3D_VIEWPORT_VERT_H__MASK 0xffff0000
-#define NV30_3D_VIEWPORT_VERT_H__SHIFT 16
-
-#define NV30_3D_LIGHT_MODEL_FRONT_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION 0x00000a10
-
-
-#define NV30_3D_LIGHT_MODEL_FRONT_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION_R 0x00000a10
-
-#define NV30_3D_LIGHT_MODEL_FRONT_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION_G 0x00000a14
-
-#define NV30_3D_LIGHT_MODEL_FRONT_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION_B 0x00000a18
-
-#define NV30_3D_VIEWPORT_TRANSLATE 0x00000a20
-
-
-#define NV30_3D_VIEWPORT_TRANSLATE_X 0x00000a20
-
-#define NV30_3D_VIEWPORT_TRANSLATE_Y 0x00000a24
-
-#define NV30_3D_VIEWPORT_TRANSLATE_Z 0x00000a28
-
-#define NV30_3D_VIEWPORT_TRANSLATE_W 0x00000a2c
-
-#define NV30_3D_VIEWPORT_SCALE 0x00000a30
-
-
-#define NV30_3D_VIEWPORT_SCALE_X 0x00000a30
-
-#define NV30_3D_VIEWPORT_SCALE_Y 0x00000a34
-
-#define NV30_3D_VIEWPORT_SCALE_Z 0x00000a38
-
-#define NV30_3D_VIEWPORT_SCALE_W 0x00000a3c
-
-#define NV30_3D_POLYGON_OFFSET_POINT_ENABLE 0x00000a60
-
-#define NV30_3D_POLYGON_OFFSET_LINE_ENABLE 0x00000a64
-
-#define NV30_3D_POLYGON_OFFSET_FILL_ENABLE 0x00000a68
-
-#define NV30_3D_DEPTH_FUNC 0x00000a6c
-#define NV30_3D_DEPTH_FUNC_NEVER 0x00000200
-#define NV30_3D_DEPTH_FUNC_LESS 0x00000201
-#define NV30_3D_DEPTH_FUNC_EQUAL 0x00000202
-#define NV30_3D_DEPTH_FUNC_LEQUAL 0x00000203
-#define NV30_3D_DEPTH_FUNC_GREATER 0x00000204
-#define NV30_3D_DEPTH_FUNC_NOTEQUAL 0x00000205
-#define NV30_3D_DEPTH_FUNC_GEQUAL 0x00000206
-#define NV30_3D_DEPTH_FUNC_ALWAYS 0x00000207
-
-#define NV30_3D_DEPTH_WRITE_ENABLE 0x00000a70
-
-#define NV30_3D_DEPTH_TEST_ENABLE 0x00000a74
-
-#define NV30_3D_POLYGON_OFFSET_FACTOR 0x00000a78
-
-#define NV30_3D_POLYGON_OFFSET_UNITS 0x00000a7c
-
-#define NV30_3D_VTX_ATTR_3I_XY(i0) (0x00000a80 + 0x8*(i0))
-#define NV30_3D_VTX_ATTR_3I_XY__ESIZE 0x00000008
-#define NV30_3D_VTX_ATTR_3I_XY__LEN 0x00000010
-#define NV30_3D_VTX_ATTR_3I_XY_X__MASK 0x0000ffff
-#define NV30_3D_VTX_ATTR_3I_XY_X__SHIFT 0
-#define NV30_3D_VTX_ATTR_3I_XY_Y__MASK 0xffff0000
-#define NV30_3D_VTX_ATTR_3I_XY_Y__SHIFT 16
-
-#define NV30_3D_VTX_ATTR_3I_Z(i0) (0x00000a84 + 0x8*(i0))
-#define NV30_3D_VTX_ATTR_3I_Z__ESIZE 0x00000008
-#define NV30_3D_VTX_ATTR_3I_Z__LEN 0x00000010
-#define NV30_3D_VTX_ATTR_3I_Z_Z__MASK 0x0000ffff
-#define NV30_3D_VTX_ATTR_3I_Z_Z__SHIFT 0
-
-#define NV30_3D_TEX_FILTER_OPTIMIZATION(i0) (0x00000b00 + 0x4*(i0))
-#define NV30_3D_TEX_FILTER_OPTIMIZATION__ESIZE 0x00000004
-#define NV30_3D_TEX_FILTER_OPTIMIZATION__LEN 0x00000004
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR__MASK 0x0000001f
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR__SHIFT 0
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR_OFF 0x00000000
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR_HIGH_QUALITY 0x00000004
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR_QUALITY 0x00000006
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR_PERFORMANCE 0x00000008
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_TRILINEAR_HIGH_PERFORMANCE 0x00000018
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_ANISO_SAMPLE__MASK 0x000001c0
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_ANISO_SAMPLE__SHIFT 6
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_ANISO_SAMPLE_OFF 0x00000000
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_ANISO_SAMPLE_HIGH_QUALITY 0x000000c0
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_ANISO_SAMPLE_QUALITY 0x000001c0
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_ANISO_SAMPLE_PERFORMANCE 0x00000140
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_UNKNOWN__MASK 0x00007c00
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_UNKNOWN__SHIFT 10
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_UNKNOWN_OFF 0x00000000
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_UNKNOWN_PARTIAL 0x00002c00
-#define NV40_3D_TEX_FILTER_OPTIMIZATION_UNKNOWN_FULL 0x00007c00
-
-#define NV40_3D_UNK0B40(i0) (0x00000b40 + 0x4*(i0))
-#define NV40_3D_UNK0B40__ESIZE 0x00000004
-#define NV40_3D_UNK0B40__LEN 0x00000008
-
-#define NV30_3D_VP_UPLOAD_INST(i0) (0x00000b80 + 0x4*(i0))
-#define NV30_3D_VP_UPLOAD_INST__ESIZE 0x00000004
-#define NV30_3D_VP_UPLOAD_INST__LEN 0x00000004
-
-
-#define NV30_3D_TEX_CLIP_PLANE(i0) (0x00000e00 + 0x10*(i0))
-
-
-#define NV30_3D_TEX_CLIP_PLANE_X(i0) (0x00000e00 + 0x10*(i0))
-
-#define NV30_3D_TEX_CLIP_PLANE_Y(i0) (0x00000e04 + 0x10*(i0))
-
-#define NV30_3D_TEX_CLIP_PLANE_Z(i0) (0x00000e08 + 0x10*(i0))
-
-#define NV30_3D_TEX_CLIP_PLANE_W(i0) (0x00000e0c + 0x10*(i0))
-
-#define NV30_3D_LIGHT 0x00001000
-
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_AMBIENT(i0) (0x00001000 + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_AMBIENT_R(i0) (0x00001000 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_AMBIENT_G(i0) (0x00001004 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_AMBIENT_B(i0) (0x00001008 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_DIFFUSE(i0) (0x0000100c + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_DIFFUSE_R(i0) (0x0000100c + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_DIFFUSE_G(i0) (0x00001010 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_DIFFUSE_B(i0) (0x00001014 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_SPECULAR(i0) (0x00001018 + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_SPECULAR_R(i0) (0x00001018 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_SPECULAR_G(i0) (0x0000101c + 0x40*(i0))
-
-#define NV30_3D_LIGHT_FRONT_SIDE_PRODUCT_SPECULAR_B(i0) (0x00001020 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_UNK24(i0) (0x00001024 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_HALF_VECTOR(i0) (0x00001028 + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_HALF_VECTOR_X(i0) (0x00001028 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_HALF_VECTOR_Y(i0) (0x0000102c + 0x40*(i0))
-
-#define NV30_3D_LIGHT_HALF_VECTOR_Z(i0) (0x00001030 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_DIRECTION(i0) (0x00001034 + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_DIRECTION_X(i0) (0x00001034 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_DIRECTION_Y(i0) (0x00001038 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_DIRECTION_Z(i0) (0x0000103c + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_SPOT_CUTOFF_A(i0) (0x00001200 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_SPOT_CUTOFF_B(i0) (0x00001204 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_SPOT_CUTOFF_C(i0) (0x00001208 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_SPOT_DIR(i0) (0x0000120c + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_SPOT_DIR_X(i0) (0x0000120c + 0x40*(i0))
-
-#define NV30_3D_LIGHT_SPOT_DIR_Y(i0) (0x00001210 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_SPOT_DIR_Z(i0) (0x00001214 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_SPOT_CUTOFF_D(i0) (0x00001218 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_POSITION(i0) (0x0000121c + 0x40*(i0))
-
-
-#define NV30_3D_LIGHT_POSITION_X(i0) (0x0000121c + 0x40*(i0))
-
-#define NV30_3D_LIGHT_POSITION_Y(i0) (0x00001220 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_POSITION_Z(i0) (0x00001224 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_ATTENUATION(i0) (0x00001228 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_ATTENUATION_CONSTANT(i0) (0x00001228 + 0x40*(i0))
-
-#define NV30_3D_LIGHT_ATTENUATION_LINEAR(i0) (0x0000122c + 0x40*(i0))
-
-#define NV30_3D_LIGHT_ATTENUATION_QUADRATIC(i0) (0x00001230 + 0x40*(i0))
-
-#define NV30_3D_FRONT_MATERIAL_SHININESS(i0) (0x00001400 + 0x4*(i0))
-#define NV30_3D_FRONT_MATERIAL_SHININESS__ESIZE 0x00000004
-#define NV30_3D_FRONT_MATERIAL_SHININESS__LEN 0x00000006
-
-#define NV30_3D_ENABLED_LIGHTS 0x00001420
-
-#define NV30_3D_VERTEX_TWO_SIDE_ENABLE 0x0000142c
-
-#define NV30_3D_FP_REG_CONTROL 0x00001450
-#define NV30_3D_FP_REG_CONTROL_UNK0__MASK 0x0000ffff
-#define NV30_3D_FP_REG_CONTROL_UNK0__SHIFT 0
-#define NV30_3D_FP_REG_CONTROL_UNK1__MASK 0xffff0000
-#define NV30_3D_FP_REG_CONTROL_UNK1__SHIFT 16
-
-#define NV30_3D_FLATSHADE_FIRST 0x00001454
-
-#define NV30_3D_EDGEFLAG 0x0000145c
-#define NV30_3D_EDGEFLAG_ENABLE 0x00000001
-
-#define NV30_3D_VP_CLIP_PLANES_ENABLE 0x00001478
-#define NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE0 0x00000002
-#define NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE1 0x00000020
-#define NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE2 0x00000200
-#define NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE3 0x00002000
-#define NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE4 0x00020000
-#define NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE5 0x00200000
-
-#define NV30_3D_POLYGON_STIPPLE_ENABLE 0x0000147c
-
-#define NV30_3D_POLYGON_STIPPLE_PATTERN(i0) (0x00001480 + 0x4*(i0))
-#define NV30_3D_POLYGON_STIPPLE_PATTERN__ESIZE 0x00000004
-#define NV30_3D_POLYGON_STIPPLE_PATTERN__LEN 0x00000020
-
-#define NV30_3D_VTX_ATTR_3F(i0) (0x00001500 + 0x10*(i0))
-#define NV30_3D_VTX_ATTR_3F__ESIZE 0x00000010
-#define NV30_3D_VTX_ATTR_3F__LEN 0x00000010
-
-
-#define NV30_3D_VTX_ATTR_3F_X(i0) (0x00001500 + 0x10*(i0))
-
-#define NV30_3D_VTX_ATTR_3F_Y(i0) (0x00001504 + 0x10*(i0))
-
-#define NV30_3D_VTX_ATTR_3F_Z(i0) (0x00001508 + 0x10*(i0))
-
-
-#define NV30_3D_VP_CLIP_PLANE(i0, i1) (0x00001600 + 0x10*(i0) + 0x4*(i1))
-#define NV30_3D_VP_CLIP_PLANE__ESIZE 0x00000004
-#define NV30_3D_VP_CLIP_PLANE__LEN 0x00000004
-
-#define NV30_3D_VTXBUF(i0) (0x00001680 + 0x4*(i0))
-#define NV30_3D_VTXBUF__ESIZE 0x00000004
-#define NV30_3D_VTXBUF__LEN 0x00000010
-#define NV30_3D_VTXBUF_OFFSET__MASK 0x0fffffff
-#define NV30_3D_VTXBUF_OFFSET__SHIFT 0
-#define NV30_3D_VTXBUF_DMA1 0x80000000
-
-#define NV40_3D_VTX_CACHE_INVALIDATE 0x00001714
-
-#define NV30_3D_VTXFMT(i0) (0x00001740 + 0x4*(i0))
-#define NV30_3D_VTXFMT__ESIZE 0x00000004
-#define NV30_3D_VTXFMT__LEN 0x00000010
-#define NV30_3D_VTXFMT_TYPE__MASK 0x0000000f
-#define NV30_3D_VTXFMT_TYPE__SHIFT 0
-#define NV30_3D_VTXFMT_TYPE_B8G8R8A8_UNORM 0x00000000
-#define NV30_3D_VTXFMT_TYPE_V16_SNORM 0x00000001
-#define NV30_3D_VTXFMT_TYPE_V32_FLOAT 0x00000002
-#define NV30_3D_VTXFMT_TYPE_V16_FLOAT 0x00000003
-#define NV30_3D_VTXFMT_TYPE_U8_UNORM 0x00000004
-#define NV30_3D_VTXFMT_TYPE_V16_SSCALED 0x00000005
-#define NV30_3D_VTXFMT_TYPE_U8_USCALED 0x00000007
-#define NV30_3D_VTXFMT_SIZE__MASK 0x000000f0
-#define NV30_3D_VTXFMT_SIZE__SHIFT 4
-#define NV30_3D_VTXFMT_STRIDE__MASK 0x0000ff00
-#define NV30_3D_VTXFMT_STRIDE__SHIFT 8
-
-#define NV30_3D_LIGHT_MODEL_BACK_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION 0x000017a0
-
-
-#define NV30_3D_LIGHT_MODEL_BACK_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION_R 0x000017a0
-
-#define NV30_3D_LIGHT_MODEL_BACK_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION_G 0x000017a4
-
-#define NV30_3D_LIGHT_MODEL_BACK_SIDE_PRODUCT_AMBIENT_PLUS_EMISSION_B 0x000017a8
-
-#define NV30_3D_COLOR_MATERIAL_BACK 0x000017b0
-
-
-#define NV30_3D_COLOR_MATERIAL_BACK_R 0x000017b0
-
-#define NV30_3D_COLOR_MATERIAL_BACK_G 0x000017b4
-
-#define NV30_3D_COLOR_MATERIAL_BACK_B 0x000017b8
-
-#define NV30_3D_COLOR_MATERIAL_BACK_A 0x000017bc
-
-#define NV30_3D_QUERY_RESET 0x000017c8
-
-#define NV30_3D_QUERY_ENABLE 0x000017cc
-
-#define NV30_3D_QUERY_GET 0x00001800
-#define NV30_3D_QUERY_GET_OFFSET__MASK 0x00ffffff
-#define NV30_3D_QUERY_GET_OFFSET__SHIFT 0
-#define NV30_3D_QUERY_GET_UNK24__MASK 0xff000000
-#define NV30_3D_QUERY_GET_UNK24__SHIFT 24
-
-#define NV30_3D_VERTEX_BEGIN_END 0x00001808
-#define NV30_3D_VERTEX_BEGIN_END_STOP 0x00000000
-#define NV30_3D_VERTEX_BEGIN_END_POINTS 0x00000001
-#define NV30_3D_VERTEX_BEGIN_END_LINES 0x00000002
-#define NV30_3D_VERTEX_BEGIN_END_LINE_LOOP 0x00000003
-#define NV30_3D_VERTEX_BEGIN_END_LINE_STRIP 0x00000004
-#define NV30_3D_VERTEX_BEGIN_END_TRIANGLES 0x00000005
-#define NV30_3D_VERTEX_BEGIN_END_TRIANGLE_STRIP 0x00000006
-#define NV30_3D_VERTEX_BEGIN_END_TRIANGLE_FAN 0x00000007
-#define NV30_3D_VERTEX_BEGIN_END_QUADS 0x00000008
-#define NV30_3D_VERTEX_BEGIN_END_QUAD_STRIP 0x00000009
-#define NV30_3D_VERTEX_BEGIN_END_POLYGON 0x0000000a
-
-#define NV30_3D_VB_ELEMENT_U16 0x0000180c
-#define NV30_3D_VB_ELEMENT_U16_0__MASK 0x0000ffff
-#define NV30_3D_VB_ELEMENT_U16_0__SHIFT 0
-#define NV30_3D_VB_ELEMENT_U16_1__MASK 0xffff0000
-#define NV30_3D_VB_ELEMENT_U16_1__SHIFT 16
-
-#define NV30_3D_VB_ELEMENT_U32 0x00001810
-
-#define NV30_3D_VB_VERTEX_BATCH 0x00001814
-#define NV30_3D_VB_VERTEX_BATCH_OFFSET__MASK 0x00ffffff
-#define NV30_3D_VB_VERTEX_BATCH_OFFSET__SHIFT 0
-#define NV30_3D_VB_VERTEX_BATCH_COUNT__MASK 0xff000000
-#define NV30_3D_VB_VERTEX_BATCH_COUNT__SHIFT 24
-
-#define NV30_3D_VERTEX_DATA 0x00001818
-
-#define NV30_3D_IDXBUF_OFFSET 0x0000181c
-
-#define NV30_3D_IDXBUF_FORMAT 0x00001820
-#define NV30_3D_IDXBUF_FORMAT_DMA1 0x00000001
-#define NV30_3D_IDXBUF_FORMAT_TYPE__MASK 0x000000f0
-#define NV30_3D_IDXBUF_FORMAT_TYPE__SHIFT 4
-#define NV30_3D_IDXBUF_FORMAT_TYPE_U32 0x00000000
-#define NV30_3D_IDXBUF_FORMAT_TYPE_U16 0x00000010
-
-#define NV30_3D_VB_INDEX_BATCH 0x00001824
-#define NV30_3D_VB_INDEX_BATCH_START__MASK 0x00ffffff
-#define NV30_3D_VB_INDEX_BATCH_START__SHIFT 0
-#define NV30_3D_VB_INDEX_BATCH_COUNT__MASK 0xff000000
-#define NV30_3D_VB_INDEX_BATCH_COUNT__SHIFT 24
-
-#define NV30_3D_POLYGON_MODE_FRONT 0x00001828
-#define NV30_3D_POLYGON_MODE_FRONT_POINT 0x00001b00
-#define NV30_3D_POLYGON_MODE_FRONT_LINE 0x00001b01
-#define NV30_3D_POLYGON_MODE_FRONT_FILL 0x00001b02
-
-#define NV30_3D_POLYGON_MODE_BACK 0x0000182c
-#define NV30_3D_POLYGON_MODE_BACK_POINT 0x00001b00
-#define NV30_3D_POLYGON_MODE_BACK_LINE 0x00001b01
-#define NV30_3D_POLYGON_MODE_BACK_FILL 0x00001b02
-
-#define NV30_3D_CULL_FACE 0x00001830
-#define NV30_3D_CULL_FACE_FRONT 0x00000404
-#define NV30_3D_CULL_FACE_BACK 0x00000405
-#define NV30_3D_CULL_FACE_FRONT_AND_BACK 0x00000408
-
-#define NV30_3D_FRONT_FACE 0x00001834
-#define NV30_3D_FRONT_FACE_CW 0x00000900
-#define NV30_3D_FRONT_FACE_CCW 0x00000901
-
-#define NV30_3D_POLYGON_SMOOTH_ENABLE 0x00001838
-
-#define NV30_3D_CULL_FACE_ENABLE 0x0000183c
-
-#define NV30_3D_TEX_PALETTE_OFFSET(i0) (0x00001840 + 0x4*(i0))
-#define NV30_3D_TEX_PALETTE_OFFSET__ESIZE 0x00000004
-#define NV30_3D_TEX_PALETTE_OFFSET__LEN 0x00000008
-
-#define NV40_3D_TEX_SIZE1(i0) (0x00001840 + 0x4*(i0))
-#define NV40_3D_TEX_SIZE1__ESIZE 0x00000004
-#define NV40_3D_TEX_SIZE1__LEN 0x00000008
-#define NV40_3D_TEX_SIZE1_DEPTH__MASK 0xfff00000
-#define NV40_3D_TEX_SIZE1_DEPTH__SHIFT 20
-#define NV40_3D_TEX_SIZE1_PITCH__MASK 0x0000ffff
-#define NV40_3D_TEX_SIZE1_PITCH__SHIFT 0
-
-#define NV30_3D_VTX_ATTR_2F(i0) (0x00001880 + 0x8*(i0))
-#define NV30_3D_VTX_ATTR_2F__ESIZE 0x00000008
-#define NV30_3D_VTX_ATTR_2F__LEN 0x00000010
-
-
-#define NV30_3D_VTX_ATTR_2F_X(i0) (0x00001880 + 0x8*(i0))
-
-#define NV30_3D_VTX_ATTR_2F_Y(i0) (0x00001884 + 0x8*(i0))
-
-#define NV30_3D_VTX_ATTR_2I(i0) (0x00001900 + 0x4*(i0))
-#define NV30_3D_VTX_ATTR_2I__ESIZE 0x00000004
-#define NV30_3D_VTX_ATTR_2I__LEN 0x00000010
-#define NV30_3D_VTX_ATTR_2I_X__MASK 0x0000ffff
-#define NV30_3D_VTX_ATTR_2I_X__SHIFT 0
-#define NV30_3D_VTX_ATTR_2I_Y__MASK 0xffff0000
-#define NV30_3D_VTX_ATTR_2I_Y__SHIFT 16
-
-#define NV30_3D_VTX_ATTR_4UB(i0) (0x00001940 + 0x4*(i0))
-#define NV30_3D_VTX_ATTR_4UB__ESIZE 0x00000004
-#define NV30_3D_VTX_ATTR_4UB__LEN 0x00000010
-#define NV30_3D_VTX_ATTR_4UB_X__MASK 0x000000ff
-#define NV30_3D_VTX_ATTR_4UB_X__SHIFT 0
-#define NV30_3D_VTX_ATTR_4UB_Y__MASK 0x0000ff00
-#define NV30_3D_VTX_ATTR_4UB_Y__SHIFT 8
-#define NV30_3D_VTX_ATTR_4UB_Z__MASK 0x00ff0000
-#define NV30_3D_VTX_ATTR_4UB_Z__SHIFT 16
-#define NV30_3D_VTX_ATTR_4UB_W__MASK 0xff000000
-#define NV30_3D_VTX_ATTR_4UB_W__SHIFT 24
-
-#define NV30_3D_VTX_ATTR_4I(i0) (0x00001980 + 0x8*(i0))
-#define NV30_3D_VTX_ATTR_4I__ESIZE 0x00000008
-#define NV30_3D_VTX_ATTR_4I__LEN 0x00000010
-
-#define NV30_3D_VTX_ATTR_4I_XY(i0) (0x00001980 + 0x8*(i0))
-#define NV30_3D_VTX_ATTR_4I_XY_X__MASK 0x0000ffff
-#define NV30_3D_VTX_ATTR_4I_XY_X__SHIFT 0
-#define NV30_3D_VTX_ATTR_4I_XY_Y__MASK 0xffff0000
-#define NV30_3D_VTX_ATTR_4I_XY_Y__SHIFT 16
-
-#define NV30_3D_VTX_ATTR_4I_ZW(i0) (0x00001984 + 0x8*(i0))
-#define NV30_3D_VTX_ATTR_4I_ZW_Z__MASK 0x0000ffff
-#define NV30_3D_VTX_ATTR_4I_ZW_Z__SHIFT 0
-#define NV30_3D_VTX_ATTR_4I_ZW_W__MASK 0xffff0000
-#define NV30_3D_VTX_ATTR_4I_ZW_W__SHIFT 16
-
-#define NV30_3D_TEX_OFFSET(i0) (0x00001a00 + 0x20*(i0))
-#define NV30_3D_TEX_OFFSET__ESIZE 0x00000020
-#define NV30_3D_TEX_OFFSET__LEN 0x00000008
-
-#define NV30_3D_TEX_FORMAT(i0) (0x00001a04 + 0x20*(i0))
-#define NV30_3D_TEX_FORMAT__ESIZE 0x00000020
-#define NV30_3D_TEX_FORMAT__LEN 0x00000008
-#define NV30_3D_TEX_FORMAT_DMA0 0x00000001
-#define NV30_3D_TEX_FORMAT_DMA1 0x00000002
-#define NV30_3D_TEX_FORMAT_CUBIC 0x00000004
-#define NV30_3D_TEX_FORMAT_NO_BORDER 0x00000008
-#define NV30_3D_TEX_FORMAT_DIMS__MASK 0x000000f0
-#define NV30_3D_TEX_FORMAT_DIMS__SHIFT 4
-#define NV30_3D_TEX_FORMAT_DIMS_1D 0x00000010
-#define NV30_3D_TEX_FORMAT_DIMS_2D 0x00000020
-#define NV30_3D_TEX_FORMAT_DIMS_3D 0x00000030
-#define NV30_3D_TEX_FORMAT_FORMAT__MASK 0x0000ff00
-#define NV30_3D_TEX_FORMAT_FORMAT__SHIFT 8
-#define NV30_3D_TEX_FORMAT_FORMAT_L8 0x00000000
-#define NV30_3D_TEX_FORMAT_FORMAT_I8 0x00000100
-#define NV30_3D_TEX_FORMAT_FORMAT_A1R5G5B5 0x00000200
-#define NV30_3D_TEX_FORMAT_FORMAT_A4R4G4B4 0x00000400
-#define NV30_3D_TEX_FORMAT_FORMAT_R5G6B5 0x00000500
-#define NV30_3D_TEX_FORMAT_FORMAT_A8R8G8B8 0x00000600
-#define NV30_3D_TEX_FORMAT_FORMAT_X8R8G8B8 0x00000700
-#define NV30_3D_TEX_FORMAT_FORMAT_INDEX8 0x00000b00
-#define NV30_3D_TEX_FORMAT_FORMAT_DXT1 0x00000c00
-#define NV30_3D_TEX_FORMAT_FORMAT_DXT3 0x00000e00
-#define NV30_3D_TEX_FORMAT_FORMAT_DXT5 0x00000f00
-#define NV30_3D_TEX_FORMAT_FORMAT_A1R5G5B5_RECT 0x00001000
-#define NV30_3D_TEX_FORMAT_FORMAT_R5G6B5_RECT 0x00001100
-#define NV30_3D_TEX_FORMAT_FORMAT_A8R8G8B8_RECT 0x00001200
-#define NV30_3D_TEX_FORMAT_FORMAT_L8_RECT 0x00001300
-#define NV30_3D_TEX_FORMAT_FORMAT_DSDT8_RECT 0x00001700
-#define NV30_3D_TEX_FORMAT_FORMAT_A8L8 0x00001a00
-#define NV30_3D_TEX_FORMAT_FORMAT_I8_RECT 0x00001b00
-#define NV30_3D_TEX_FORMAT_FORMAT_A4R4G4B4_RECT 0x00001d00
-#define NV30_3D_TEX_FORMAT_FORMAT_R8G8B8_RECT 0x00001e00
-#define NV30_3D_TEX_FORMAT_FORMAT_A8L8_RECT 0x00002000
-#define NV30_3D_TEX_FORMAT_FORMAT_Z24 0x00002a00
-#define NV30_3D_TEX_FORMAT_FORMAT_Z24_RECT 0x00002b00
-#define NV30_3D_TEX_FORMAT_FORMAT_Z16 0x00002c00
-#define NV30_3D_TEX_FORMAT_FORMAT_Z16_RECT 0x00002d00
-#define NV30_3D_TEX_FORMAT_FORMAT_DSDT8 0x00002800
-#define NV30_3D_TEX_FORMAT_FORMAT_HILO16 0x00003300
-#define NV30_3D_TEX_FORMAT_FORMAT_HILO16_RECT 0x00003600
-#define NV30_3D_TEX_FORMAT_FORMAT_HILO8 0x00004400
-#define NV30_3D_TEX_FORMAT_FORMAT_SIGNED_HILO8 0x00004500
-#define NV30_3D_TEX_FORMAT_FORMAT_HILO8_RECT 0x00004600
-#define NV30_3D_TEX_FORMAT_FORMAT_SIGNED_HILO8_RECT 0x00004700
-#define NV30_3D_TEX_FORMAT_FORMAT_A16 0x00003200
-#define NV30_3D_TEX_FORMAT_FORMAT_A16_RECT 0x00003500
-#define NV30_3D_TEX_FORMAT_FORMAT_UNK3F 0x00003f00
-#define NV30_3D_TEX_FORMAT_FORMAT_FLOAT_RGBA16_NV 0x00004a00
-#define NV30_3D_TEX_FORMAT_FORMAT_FLOAT_RGBA32_NV 0x00004b00
-#define NV30_3D_TEX_FORMAT_FORMAT_FLOAT_R32_NV 0x00004c00
-#define NV40_3D_TEX_FORMAT_FORMAT__MASK 0x00001f00
-#define NV40_3D_TEX_FORMAT_FORMAT__SHIFT 8
-#define NV40_3D_TEX_FORMAT_FORMAT_L8 0x00000100
-#define NV40_3D_TEX_FORMAT_FORMAT_A1R5G5B5 0x00000200
-#define NV40_3D_TEX_FORMAT_FORMAT_A4R4G4B4 0x00000300
-#define NV40_3D_TEX_FORMAT_FORMAT_R5G6B5 0x00000400
-#define NV40_3D_TEX_FORMAT_FORMAT_A8R8G8B8 0x00000500
-#define NV40_3D_TEX_FORMAT_FORMAT_DXT1 0x00000600
-#define NV40_3D_TEX_FORMAT_FORMAT_DXT3 0x00000700
-#define NV40_3D_TEX_FORMAT_FORMAT_DXT5 0x00000800
-#define NV40_3D_TEX_FORMAT_FORMAT_A8L8 0x00000b00
-#define NV40_3D_TEX_FORMAT_FORMAT_Z24 0x00001000
-#define NV40_3D_TEX_FORMAT_FORMAT_Z16 0x00001200
-#define NV40_3D_TEX_FORMAT_FORMAT_A16 0x00001400
-#define NV40_3D_TEX_FORMAT_FORMAT_A16L16 0x00001500
-#define NV40_3D_TEX_FORMAT_FORMAT_HILO8 0x00001800
-#define NV40_3D_TEX_FORMAT_FORMAT_RGBA16F 0x00001a00
-#define NV40_3D_TEX_FORMAT_FORMAT_RGBA32F 0x00001b00
-#define NV40_3D_TEX_FORMAT_LINEAR 0x00002000
-#define NV40_3D_TEX_FORMAT_RECT 0x00004000
-#define NV40_3D_TEX_FORMAT_MIPMAP_COUNT__MASK 0x000f0000
-#define NV40_3D_TEX_FORMAT_MIPMAP_COUNT__SHIFT 16
-#define NV30_3D_TEX_FORMAT_MIPMAP 0x00080000
-#define NV30_3D_TEX_FORMAT_BASE_SIZE_U__MASK 0x00f00000
-#define NV30_3D_TEX_FORMAT_BASE_SIZE_U__SHIFT 20
-#define NV30_3D_TEX_FORMAT_BASE_SIZE_V__MASK 0x0f000000
-#define NV30_3D_TEX_FORMAT_BASE_SIZE_V__SHIFT 24
-#define NV30_3D_TEX_FORMAT_BASE_SIZE_W__MASK 0xf0000000
-#define NV30_3D_TEX_FORMAT_BASE_SIZE_W__SHIFT 28
-
-#define NV30_3D_TEX_WRAP(i0) (0x00001a08 + 0x20*(i0))
-#define NV30_3D_TEX_WRAP__ESIZE 0x00000020
-#define NV30_3D_TEX_WRAP__LEN 0x00000008
-#define NV30_3D_TEX_WRAP_S__MASK 0x000000ff
-#define NV30_3D_TEX_WRAP_S__SHIFT 0
-#define NV30_3D_TEX_WRAP_S_REPEAT 0x00000001
-#define NV30_3D_TEX_WRAP_S_MIRRORED_REPEAT 0x00000002
-#define NV30_3D_TEX_WRAP_S_CLAMP_TO_EDGE 0x00000003
-#define NV30_3D_TEX_WRAP_S_CLAMP_TO_BORDER 0x00000004
-#define NV30_3D_TEX_WRAP_S_CLAMP 0x00000005
-#define NV40_3D_TEX_WRAP_S_MIRROR_CLAMP_TO_EDGE 0x00000006
-#define NV40_3D_TEX_WRAP_S_MIRROR_CLAMP_TO_BORDER 0x00000007
-#define NV40_3D_TEX_WRAP_S_MIRROR_CLAMP 0x00000008
-#define NV40_3D_TEX_WRAP_ANISO_MIP_FILTER_OPTIMIZATION__MASK 0x00000070
-#define NV40_3D_TEX_WRAP_ANISO_MIP_FILTER_OPTIMIZATION__SHIFT 4
-#define NV40_3D_TEX_WRAP_ANISO_MIP_FILTER_OPTIMIZATION_OFF 0x00000000
-#define NV40_3D_TEX_WRAP_ANISO_MIP_FILTER_OPTIMIZATION_QUALITY 0x00000020
-#define NV40_3D_TEX_WRAP_ANISO_MIP_FILTER_OPTIMIZATION_PERFORMANCE 0x00000030
-#define NV40_3D_TEX_WRAP_ANISO_MIP_FILTER_OPTIMIZATION_HIGH_PERFORMANCE 0x00000070
-#define NV30_3D_TEX_WRAP_T__MASK 0x00000f00
-#define NV30_3D_TEX_WRAP_T__SHIFT 8
-#define NV30_3D_TEX_WRAP_T_REPEAT 0x00000100
-#define NV30_3D_TEX_WRAP_T_MIRRORED_REPEAT 0x00000200
-#define NV30_3D_TEX_WRAP_T_CLAMP_TO_EDGE 0x00000300
-#define NV30_3D_TEX_WRAP_T_CLAMP_TO_BORDER 0x00000400
-#define NV30_3D_TEX_WRAP_T_CLAMP 0x00000500
-#define NV40_3D_TEX_WRAP_T_MIRROR_CLAMP_TO_EDGE 0x00000600
-#define NV40_3D_TEX_WRAP_T_MIRROR_CLAMP_TO_BORDER 0x00000700
-#define NV40_3D_TEX_WRAP_T_MIRROR_CLAMP 0x00000800
-#define NV30_3D_TEX_WRAP_EXPAND_NORMAL 0x0000f000
-#define NV30_3D_TEX_WRAP_R__MASK 0x000f0000
-#define NV30_3D_TEX_WRAP_R__SHIFT 16
-#define NV30_3D_TEX_WRAP_R_REPEAT 0x00010000
-#define NV30_3D_TEX_WRAP_R_MIRRORED_REPEAT 0x00020000
-#define NV30_3D_TEX_WRAP_R_CLAMP_TO_EDGE 0x00030000
-#define NV30_3D_TEX_WRAP_R_CLAMP_TO_BORDER 0x00040000
-#define NV30_3D_TEX_WRAP_R_CLAMP 0x00050000
-#define NV40_3D_TEX_WRAP_R_MIRROR_CLAMP_TO_EDGE 0x00060000
-#define NV40_3D_TEX_WRAP_R_MIRROR_CLAMP_TO_BORDER 0x00070000
-#define NV40_3D_TEX_WRAP_R_MIRROR_CLAMP 0x00080000
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER__MASK 0x00f00000
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER__SHIFT 20
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER_NONE 0x00000000
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER_RED 0x00100000
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER_GREEN 0x00200000
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER_BLUE 0x00400000
-#define NV40_3D_TEX_WRAP_GAMMA_DECREASE_FILTER_ALL 0x00f00000
-#define NV30_3D_TEX_WRAP_RCOMP__MASK 0xf0000000
-#define NV30_3D_TEX_WRAP_RCOMP__SHIFT 28
-#define NV30_3D_TEX_WRAP_RCOMP_NEVER 0x00000000
-#define NV30_3D_TEX_WRAP_RCOMP_GREATER 0x10000000
-#define NV30_3D_TEX_WRAP_RCOMP_EQUAL 0x20000000
-#define NV30_3D_TEX_WRAP_RCOMP_GEQUAL 0x30000000
-#define NV30_3D_TEX_WRAP_RCOMP_LESS 0x40000000
-#define NV30_3D_TEX_WRAP_RCOMP_NOTEQUAL 0x50000000
-#define NV30_3D_TEX_WRAP_RCOMP_LEQUAL 0x60000000
-#define NV30_3D_TEX_WRAP_RCOMP_ALWAYS 0x70000000
-
-#define NV30_3D_TEX_ENABLE(i0) (0x00001a0c + 0x20*(i0))
-#define NV30_3D_TEX_ENABLE__ESIZE 0x00000020
-#define NV30_3D_TEX_ENABLE__LEN 0x00000008
-#define NV30_3D_TEX_ENABLE_ANISO__MASK 0x00000030
-#define NV30_3D_TEX_ENABLE_ANISO__SHIFT 4
-#define NV30_3D_TEX_ENABLE_ANISO_NONE 0x00000000
-#define NV30_3D_TEX_ENABLE_ANISO_2X 0x00000010
-#define NV30_3D_TEX_ENABLE_ANISO_4X 0x00000020
-#define NV30_3D_TEX_ENABLE_ANISO_8X 0x00000030
-#define NV40_3D_TEX_ENABLE_ANISO__MASK 0x000000f0
-#define NV40_3D_TEX_ENABLE_ANISO__SHIFT 4
-#define NV40_3D_TEX_ENABLE_ANISO_NONE 0x00000000
-#define NV40_3D_TEX_ENABLE_ANISO_2X 0x00000010
-#define NV40_3D_TEX_ENABLE_ANISO_4X 0x00000020
-#define NV40_3D_TEX_ENABLE_ANISO_6X 0x00000030
-#define NV40_3D_TEX_ENABLE_ANISO_8X 0x00000040
-#define NV40_3D_TEX_ENABLE_ANISO_10X 0x00000050
-#define NV40_3D_TEX_ENABLE_ANISO_12X 0x00000060
-#define NV40_3D_TEX_ENABLE_ANISO_16X 0x00000070
-#define NV30_3D_TEX_ENABLE_MIPMAP_MAX_LOD__MASK 0x0003c000
-#define NV30_3D_TEX_ENABLE_MIPMAP_MAX_LOD__SHIFT 14
-#define NV40_3D_TEX_ENABLE_MIPMAP_MAX_LOD__MASK 0x00038000
-#define NV40_3D_TEX_ENABLE_MIPMAP_MAX_LOD__SHIFT 15
-#define NV30_3D_TEX_ENABLE_MIPMAP_MIN_LOD__MASK 0x3c000000
-#define NV30_3D_TEX_ENABLE_MIPMAP_MIN_LOD__SHIFT 26
-#define NV40_3D_TEX_ENABLE_MIPMAP_MIN_LOD__MASK 0x38000000
-#define NV40_3D_TEX_ENABLE_MIPMAP_MIN_LOD__SHIFT 27
-#define NV30_3D_TEX_ENABLE_ENABLE 0x40000000
-#define NV40_3D_TEX_ENABLE_ENABLE 0x80000000
-
-#define NV30_3D_TEX_SWIZZLE(i0) (0x00001a10 + 0x20*(i0))
-#define NV30_3D_TEX_SWIZZLE__ESIZE 0x00000020
-#define NV30_3D_TEX_SWIZZLE__LEN 0x00000008
-#define NV30_3D_TEX_SWIZZLE_S1_W__MASK 0x00000003
-#define NV30_3D_TEX_SWIZZLE_S1_W__SHIFT 0
-#define NV30_3D_TEX_SWIZZLE_S1_W_W 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S1_W_Z 0x00000001
-#define NV30_3D_TEX_SWIZZLE_S1_W_Y 0x00000002
-#define NV30_3D_TEX_SWIZZLE_S1_W_X 0x00000003
-#define NV30_3D_TEX_SWIZZLE_S1_Z__MASK 0x0000000c
-#define NV30_3D_TEX_SWIZZLE_S1_Z__SHIFT 2
-#define NV30_3D_TEX_SWIZZLE_S1_Z_W 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S1_Z_Z 0x00000004
-#define NV30_3D_TEX_SWIZZLE_S1_Z_Y 0x00000008
-#define NV30_3D_TEX_SWIZZLE_S1_Z_X 0x0000000c
-#define NV30_3D_TEX_SWIZZLE_S1_Y__MASK 0x00000030
-#define NV30_3D_TEX_SWIZZLE_S1_Y__SHIFT 4
-#define NV30_3D_TEX_SWIZZLE_S1_Y_W 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S1_Y_Z 0x00000010
-#define NV30_3D_TEX_SWIZZLE_S1_Y_Y 0x00000020
-#define NV30_3D_TEX_SWIZZLE_S1_Y_X 0x00000030
-#define NV30_3D_TEX_SWIZZLE_S1_X__MASK 0x000000c0
-#define NV30_3D_TEX_SWIZZLE_S1_X__SHIFT 6
-#define NV30_3D_TEX_SWIZZLE_S1_X_W 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S1_X_Z 0x00000040
-#define NV30_3D_TEX_SWIZZLE_S1_X_Y 0x00000080
-#define NV30_3D_TEX_SWIZZLE_S1_X_X 0x000000c0
-#define NV30_3D_TEX_SWIZZLE_S0_W__MASK 0x00000300
-#define NV30_3D_TEX_SWIZZLE_S0_W__SHIFT 8
-#define NV30_3D_TEX_SWIZZLE_S0_W_ZERO 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S0_W_ONE 0x00000100
-#define NV30_3D_TEX_SWIZZLE_S0_W_S1 0x00000200
-#define NV30_3D_TEX_SWIZZLE_S0_Z__MASK 0x00000c00
-#define NV30_3D_TEX_SWIZZLE_S0_Z__SHIFT 10
-#define NV30_3D_TEX_SWIZZLE_S0_Z_ZERO 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S0_Z_ONE 0x00000400
-#define NV30_3D_TEX_SWIZZLE_S0_Z_S1 0x00000800
-#define NV30_3D_TEX_SWIZZLE_S0_Y__MASK 0x00003000
-#define NV30_3D_TEX_SWIZZLE_S0_Y__SHIFT 12
-#define NV30_3D_TEX_SWIZZLE_S0_Y_ZERO 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S0_Y_ONE 0x00001000
-#define NV30_3D_TEX_SWIZZLE_S0_Y_S1 0x00002000
-#define NV30_3D_TEX_SWIZZLE_S0_X__MASK 0x0000c000
-#define NV30_3D_TEX_SWIZZLE_S0_X__SHIFT 14
-#define NV30_3D_TEX_SWIZZLE_S0_X_ZERO 0x00000000
-#define NV30_3D_TEX_SWIZZLE_S0_X_ONE 0x00004000
-#define NV30_3D_TEX_SWIZZLE_S0_X_S1 0x00008000
-#define NV30_3D_TEX_SWIZZLE_RECT_PITCH__MASK 0xffff0000
-#define NV30_3D_TEX_SWIZZLE_RECT_PITCH__SHIFT 16
-
-#define NV30_3D_TEX_FILTER(i0) (0x00001a14 + 0x20*(i0))
-#define NV30_3D_TEX_FILTER__ESIZE 0x00000020
-#define NV30_3D_TEX_FILTER__LEN 0x00000008
-#define NV30_3D_TEX_FILTER_LOD_BIAS__MASK 0x00000f00
-#define NV30_3D_TEX_FILTER_LOD_BIAS__SHIFT 8
-#define NV30_3D_TEX_FILTER_MIN__MASK 0x000f0000
-#define NV30_3D_TEX_FILTER_MIN__SHIFT 16
-#define NV30_3D_TEX_FILTER_MIN_NEAREST 0x00010000
-#define NV30_3D_TEX_FILTER_MIN_LINEAR 0x00020000
-#define NV30_3D_TEX_FILTER_MIN_NEAREST_MIPMAP_NEAREST 0x00030000
-#define NV30_3D_TEX_FILTER_MIN_LINEAR_MIPMAP_NEAREST 0x00040000
-#define NV30_3D_TEX_FILTER_MIN_NEAREST_MIPMAP_LINEAR 0x00050000
-#define NV30_3D_TEX_FILTER_MIN_LINEAR_MIPMAP_LINEAR 0x00060000
-#define NV30_3D_TEX_FILTER_MAG__MASK 0x0f000000
-#define NV30_3D_TEX_FILTER_MAG__SHIFT 24
-#define NV30_3D_TEX_FILTER_MAG_NEAREST 0x01000000
-#define NV30_3D_TEX_FILTER_MAG_LINEAR 0x02000000
-#define NV30_3D_TEX_FILTER_SIGNED_BLUE 0x10000000
-#define NV30_3D_TEX_FILTER_SIGNED_GREEN 0x20000000
-#define NV30_3D_TEX_FILTER_SIGNED_RED 0x40000000
-#define NV30_3D_TEX_FILTER_SIGNED_ALPHA 0x80000000
-
-#define NV30_3D_TEX_NPOT_SIZE(i0) (0x00001a18 + 0x20*(i0))
-#define NV30_3D_TEX_NPOT_SIZE__ESIZE 0x00000020
-#define NV30_3D_TEX_NPOT_SIZE__LEN 0x00000008
-#define NV30_3D_TEX_NPOT_SIZE_H__MASK 0x0000ffff
-#define NV30_3D_TEX_NPOT_SIZE_H__SHIFT 0
-#define NV30_3D_TEX_NPOT_SIZE_W__MASK 0xffff0000
-#define NV30_3D_TEX_NPOT_SIZE_W__SHIFT 16
-
-#define NV30_3D_TEX_BORDER_COLOR(i0) (0x00001a1c + 0x20*(i0))
-#define NV30_3D_TEX_BORDER_COLOR__ESIZE 0x00000020
-#define NV30_3D_TEX_BORDER_COLOR__LEN 0x00000008
-#define NV30_3D_TEX_BORDER_COLOR_B__MASK 0x000000ff
-#define NV30_3D_TEX_BORDER_COLOR_B__SHIFT 0
-#define NV30_3D_TEX_BORDER_COLOR_G__MASK 0x0000ff00
-#define NV30_3D_TEX_BORDER_COLOR_G__SHIFT 8
-#define NV30_3D_TEX_BORDER_COLOR_R__MASK 0x00ff0000
-#define NV30_3D_TEX_BORDER_COLOR_R__SHIFT 16
-#define NV30_3D_TEX_BORDER_COLOR_A__MASK 0xff000000
-#define NV30_3D_TEX_BORDER_COLOR_A__SHIFT 24
-
-#define NV30_3D_VTX_ATTR_4F(i0) (0x00001c00 + 0x10*(i0))
-#define NV30_3D_VTX_ATTR_4F__ESIZE 0x00000010
-#define NV30_3D_VTX_ATTR_4F__LEN 0x00000010
-
-
-#define NV30_3D_VTX_ATTR_4F_X(i0) (0x00001c00 + 0x10*(i0))
-
-#define NV30_3D_VTX_ATTR_4F_Y(i0) (0x00001c04 + 0x10*(i0))
-
-#define NV30_3D_VTX_ATTR_4F_Z(i0) (0x00001c08 + 0x10*(i0))
-
-#define NV30_3D_VTX_ATTR_4F_W(i0) (0x00001c0c + 0x10*(i0))
-
-#define NV30_3D_FP_CONTROL 0x00001d60
-#define NV30_3D_FP_CONTROL_USED_REGS_MINUS1_DIV2__MASK 0x0000000f
-#define NV30_3D_FP_CONTROL_USED_REGS_MINUS1_DIV2__SHIFT 0
-#define NV30_3D_FP_CONTROL_USES_KIL 0x00000080
-#define NV40_3D_FP_CONTROL_KIL 0x00000080
-#define NV40_3D_FP_CONTROL_TEMP_COUNT__MASK 0xff000000
-#define NV40_3D_FP_CONTROL_TEMP_COUNT__SHIFT 24
-
-#define NV30_3D_DEPTH_CONTROL 0x00001d78
-#define NV30_3D_DEPTH_CONTROL_CLAMP 0x000000f0
-
-#define NV30_3D_MULTISAMPLE_CONTROL 0x00001d7c
-#define NV30_3D_MULTISAMPLE_CONTROL_ENABLE 0x00000001
-#define NV30_3D_MULTISAMPLE_CONTROL_SAMPLE_ALPHA_TO_COVERAGE 0x00000010
-#define NV30_3D_MULTISAMPLE_CONTROL_SAMPLE_ALPHA_TO_ONE 0x00000100
-#define NV30_3D_MULTISAMPLE_CONTROL_SAMPLE_COVERAGE__MASK 0xffff0000
-#define NV30_3D_MULTISAMPLE_CONTROL_SAMPLE_COVERAGE__SHIFT 16
-
-#define NV30_3D_COORD_CONVENTIONS 0x00001d88
-#define NV30_3D_COORD_CONVENTIONS_HEIGHT__MASK 0x00000fff
-#define NV30_3D_COORD_CONVENTIONS_HEIGHT__SHIFT 0
-#define NV30_3D_COORD_CONVENTIONS_ORIGIN__MASK 0x00001000
-#define NV30_3D_COORD_CONVENTIONS_ORIGIN__SHIFT 12
-#define NV30_3D_COORD_CONVENTIONS_ORIGIN_NORMAL 0x00000000
-#define NV30_3D_COORD_CONVENTIONS_ORIGIN_INVERTED 0x00001000
-#define NV30_3D_COORD_CONVENTIONS_CENTER__MASK 0x00010000
-#define NV30_3D_COORD_CONVENTIONS_CENTER__SHIFT 16
-#define NV30_3D_COORD_CONVENTIONS_CENTER_HALF_INTEGER 0x00000000
-#define NV30_3D_COORD_CONVENTIONS_CENTER_INTEGER 0x00010000
-
-#define NV30_3D_CLEAR_DEPTH_VALUE 0x00001d8c
-
-#define NV30_3D_CLEAR_COLOR_VALUE 0x00001d90
-#define NV30_3D_CLEAR_COLOR_VALUE_B__MASK 0x000000ff
-#define NV30_3D_CLEAR_COLOR_VALUE_B__SHIFT 0
-#define NV30_3D_CLEAR_COLOR_VALUE_G__MASK 0x0000ff00
-#define NV30_3D_CLEAR_COLOR_VALUE_G__SHIFT 8
-#define NV30_3D_CLEAR_COLOR_VALUE_R__MASK 0x00ff0000
-#define NV30_3D_CLEAR_COLOR_VALUE_R__SHIFT 16
-#define NV30_3D_CLEAR_COLOR_VALUE_A__MASK 0xff000000
-#define NV30_3D_CLEAR_COLOR_VALUE_A__SHIFT 24
-
-#define NV30_3D_CLEAR_BUFFERS 0x00001d94
-#define NV30_3D_CLEAR_BUFFERS_DEPTH 0x00000001
-#define NV30_3D_CLEAR_BUFFERS_STENCIL 0x00000002
-#define NV30_3D_CLEAR_BUFFERS_COLOR_R 0x00000010
-#define NV30_3D_CLEAR_BUFFERS_COLOR_G 0x00000020
-#define NV30_3D_CLEAR_BUFFERS_COLOR_B 0x00000040
-#define NV30_3D_CLEAR_BUFFERS_COLOR_A 0x00000080
-
-#define NV30_3D_DO_VERTICES 0x00001dac
-
-#define NV30_3D_LINE_STIPPLE_ENABLE 0x00001db4
-
-#define NV30_3D_LINE_STIPPLE_PATTERN 0x00001db8
-#define NV30_3D_LINE_STIPPLE_PATTERN_FACTOR__MASK 0x0000ffff
-#define NV30_3D_LINE_STIPPLE_PATTERN_FACTOR__SHIFT 0
-#define NV30_3D_LINE_STIPPLE_PATTERN_PATTERN__MASK 0xffff0000
-#define NV30_3D_LINE_STIPPLE_PATTERN_PATTERN__SHIFT 16
-
-#define NV30_3D_BACK_MATERIAL_SHININESS(i0) (0x00001e20 + 0x4*(i0))
-#define NV30_3D_BACK_MATERIAL_SHININESS__ESIZE 0x00000004
-#define NV30_3D_BACK_MATERIAL_SHININESS__LEN 0x00000006
-
-#define NV30_3D_VTX_ATTR_1F(i0) (0x00001e40 + 0x4*(i0))
-#define NV30_3D_VTX_ATTR_1F__ESIZE 0x00000004
-#define NV30_3D_VTX_ATTR_1F__LEN 0x00000010
-
-#define NV30_3D_ENGINE 0x00001e94
-#define NV30_3D_ENGINE_FP 0x00000001
-#define NV30_3D_ENGINE_VP 0x00000002
-#define NV30_3D_ENGINE_FIXED 0x00000004
-
-#define NV30_3D_VP_UPLOAD_FROM_ID 0x00001e9c
-
-#define NV30_3D_VP_START_FROM_ID 0x00001ea0
-
-#define NV30_3D_POINT_PARAMETERS(i0) (0x00001ec0 + 0x4*(i0))
-#define NV30_3D_POINT_PARAMETERS__ESIZE 0x00000004
-#define NV30_3D_POINT_PARAMETERS__LEN 0x00000008
-
-#define NV30_3D_POINT_SIZE 0x00001ee0
-
-#define NV30_3D_POINT_PARAMETERS_ENABLE 0x00001ee4
-
-#define NV30_3D_POINT_SPRITE 0x00001ee8
-#define NV30_3D_POINT_SPRITE_ENABLE 0x00000001
-#define NV30_3D_POINT_SPRITE_R_MODE__MASK 0x00000006
-#define NV30_3D_POINT_SPRITE_R_MODE__SHIFT 1
-#define NV30_3D_POINT_SPRITE_R_MODE_ZERO 0x00000000
-#define NV30_3D_POINT_SPRITE_R_MODE_R 0x00000002
-#define NV30_3D_POINT_SPRITE_R_MODE_S 0x00000004
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_0 0x00000100
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_1 0x00000200
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_2 0x00000400
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_3 0x00000800
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_4 0x00001000
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_5 0x00002000
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_6 0x00004000
-#define NV30_3D_POINT_SPRITE_COORD_REPLACE_7 0x00008000
-
-#define NV30_3D_VP_UPLOAD_CONST_ID 0x00001efc
-
-#define NV30_3D_VP_UPLOAD_CONST(i0) (0x00001f00 + 0x10*(i0))
-#define NV30_3D_VP_UPLOAD_CONST__ESIZE 0x00000010
-#define NV30_3D_VP_UPLOAD_CONST__LEN 0x00000004
-
-
-#define NV30_3D_VP_UPLOAD_CONST_X(i0) (0x00001f00 + 0x10*(i0))
-
-#define NV30_3D_VP_UPLOAD_CONST_Y(i0) (0x00001f04 + 0x10*(i0))
-
-#define NV30_3D_VP_UPLOAD_CONST_Z(i0) (0x00001f08 + 0x10*(i0))
-
-#define NV30_3D_VP_UPLOAD_CONST_W(i0) (0x00001f0c + 0x10*(i0))
-
-#define NV30_3D_UNK1F80(i0) (0x00001f80 + 0x4*(i0))
-#define NV30_3D_UNK1F80__ESIZE 0x00000004
-#define NV30_3D_UNK1F80__LEN 0x00000010
-
-#define NV40_3D_TEX_CACHE_CTL 0x00001fd8
-
-#define NV40_3D_VP_ATTRIB_EN 0x00001ff0
-
-#define NV40_3D_VP_RESULT_EN 0x00001ff4
-
-
-#endif /* NV30_40_3D_XML */
+++ /dev/null
-#include "util/u_format.h"
-
-#include "nvfx_context.h"
-#include "nvfx_tex.h"
-#include "nvfx_resource.h"
-
-void
-nv30_sampler_state_init(struct pipe_context *pipe,
- struct nvfx_sampler_state *ps,
- const struct pipe_sampler_state *cso)
-{
- if (cso->max_anisotropy >= 2)
- {
- if (cso->max_anisotropy >= 8)
- ps->en |= NV30_3D_TEX_ENABLE_ANISO_8X;
- else if (cso->max_anisotropy >= 4)
- ps->en |= NV30_3D_TEX_ENABLE_ANISO_4X;
- else if (cso->max_anisotropy >= 2)
- ps->en |= NV30_3D_TEX_ENABLE_ANISO_2X;
- }
-
- ps->filt |= (int)(cso->lod_bias * 256.0) & 0x1fff;
-
- ps->max_lod = (int)CLAMP(cso->max_lod, 0.0, 15.0);
- ps->min_lod = (int)CLAMP(cso->min_lod, 0.0, 15.0);
-
- ps->en |= NV30_3D_TEX_ENABLE_ENABLE;
-}
-
-void
-nv30_sampler_view_init(struct pipe_context *pipe,
- struct nvfx_sampler_view *sv)
-{
- struct pipe_resource* pt = sv->base.texture;
- struct nvfx_texture_format *tf = &nvfx_texture_formats[sv->base.format];
- unsigned txf;
- unsigned level = pt->target == PIPE_TEXTURE_CUBE ? 0 : sv->base.u.tex.first_level;
-
- assert(tf->fmt[0] >= 0);
-
- txf = sv->u.init_fmt;
- txf |= (level != sv->base.u.tex.last_level ? NV30_3D_TEX_FORMAT_MIPMAP : 0);
- txf |= util_logbase2(u_minify(pt->width0, level)) << NV30_3D_TEX_FORMAT_BASE_SIZE_U__SHIFT;
- txf |= util_logbase2(u_minify(pt->height0, level)) << NV30_3D_TEX_FORMAT_BASE_SIZE_V__SHIFT;
- txf |= util_logbase2(u_minify(pt->depth0, level)) << NV30_3D_TEX_FORMAT_BASE_SIZE_W__SHIFT;
- txf |= 0x10000;
-
- sv->u.nv30.fmt[0] = tf->fmt[0] | txf;
- sv->u.nv30.fmt[1] = tf->fmt[1] | txf;
- sv->u.nv30.fmt[2] = tf->fmt[2] | txf;
- sv->u.nv30.fmt[3] = tf->fmt[3] | txf;
-
- sv->swizzle |= (nvfx_subresource_pitch(pt, 0) << NV30_3D_TEX_SWIZZLE_RECT_PITCH__SHIFT);
-
- if(pt->height0 <= 1 || util_format_is_compressed(sv->base.format))
- sv->u.nv30.rect = -1;
- else
- sv->u.nv30.rect = !!(pt->flags & NOUVEAU_RESOURCE_FLAG_LINEAR);
-
- sv->lod_offset = sv->base.u.tex.first_level - level;
- sv->max_lod_limit = sv->base.u.tex.last_level - level;
-}
-
-void
-nv30_fragtex_set(struct nvfx_context *nvfx, int unit)
-{
- struct nvfx_sampler_state *ps = nvfx->tex_sampler[unit];
- struct nvfx_sampler_view* sv = (struct nvfx_sampler_view*)nvfx->fragment_sampler_views[unit];
- struct nouveau_bo *bo = ((struct nvfx_miptree *)sv->base.texture)->base.bo;
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned txf;
- unsigned tex_flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_RD;
- unsigned use_rect;
- unsigned max_lod = MIN2(ps->max_lod + sv->lod_offset, sv->max_lod_limit);
- unsigned min_lod = MIN2(ps->min_lod + sv->lod_offset, max_lod) ;
-
- if(sv->u.nv30.rect < 0)
- {
- /* in the case of compressed or 1D textures, we can get away with this,
- * since the layout is the same
- */
- use_rect = ps->fmt;
- }
- else
- {
- static boolean warned = FALSE;
- if( !!ps->fmt != sv->u.nv30.rect && !warned) {
- warned = TRUE;
- fprintf(stderr,
- "Unimplemented: coordinate normalization mismatch. Possible reasons:\n"
- "1. ARB_texture_non_power_of_two is being used despite the fact it isn't supported\n"
- "2. The state tracker is not using the appropriate coordinate normalization\n"
- "3. The state tracker is not supported\n");
- }
-
- use_rect = sv->u.nv30.rect;
- }
-
- txf = sv->u.nv30.fmt[ps->compare + (use_rect ? 2 : 0)];
-
- MARK_RING(chan, 9, 2);
- BEGIN_RING(chan, eng3d, NV30_3D_TEX_OFFSET(unit), 8);
- OUT_RELOC(chan, bo, sv->offset, tex_flags | NOUVEAU_BO_LOW, 0, 0);
- OUT_RELOC(chan, bo, txf,
- tex_flags | NOUVEAU_BO_OR,
- NV30_3D_TEX_FORMAT_DMA0, NV30_3D_TEX_FORMAT_DMA1);
- OUT_RING(chan, (ps->wrap & sv->wrap_mask) | sv->wrap);
- OUT_RING(chan, ps->en | (min_lod << NV30_3D_TEX_ENABLE_MIPMAP_MIN_LOD__SHIFT) | (max_lod << NV30_3D_TEX_ENABLE_MIPMAP_MAX_LOD__SHIFT));
- OUT_RING(chan, sv->swizzle);
- OUT_RING(chan, ps->filt | sv->filt);
- OUT_RING(chan, sv->npot_size);
- OUT_RING(chan, ps->bcol);
-
- nvfx->hw_txf[unit] = txf;
- nvfx->hw_samplers |= (1 << unit);
-}
+++ /dev/null
-#ifndef __NV30_SHADER_H__
-#define __NV30_SHADER_H__
-
-/* Vertex programs instruction set
- *
- * 128bit opcodes, split into 4 32-bit ones for ease of use.
- *
- * Non-native instructions
- * ABS - MOV + NV40_VP_INST0_DEST_ABS
- * POW - EX2 + MUL + LG2
- * SUB - ADD, second source negated
- * SWZ - MOV
- * XPD -
- *
- * Register access
- * - Only one INPUT can be accessed per-instruction (move extras into TEMPs)
- * - Only one CONST can be accessed per-instruction (move extras into TEMPs)
- *
- * Relative Addressing
- * According to the value returned for
- * MAX_PROGRAM_NATIVE_ADDRESS_REGISTERS_ARB
- *
- * there are only two address registers available. The destination in the
- * ARL instruction is set to TEMP <n> (The temp isn't actually written).
- *
- * When using vanilla ARB_v_p, the proprietary driver will squish both the
- * available ADDRESS regs into the first hardware reg in the X and Y
- * components.
- *
- * To use an address reg as an index into consts, the CONST_SRC is set to
- * (const_base + offset) and INDEX_CONST is set.
- *
- * To access the second address reg use ADDR_REG_SELECT_1. A particular
- * component of the address regs is selected with ADDR_SWZ.
- *
- * Only one address register can be accessed per instruction.
- *
- * Conditional execution (see NV_vertex_program{2,3} for details) Conditional
- * execution of an instruction is enabled by setting COND_TEST_ENABLE, and
- * selecting the condition which will allow the test to pass with
- * COND_{FL,LT,...}. It is possible to swizzle the values in the condition
- * register, which allows for testing against an individual component.
- *
- * Branching:
- *
- * The BRA/CAL instructions seem to follow a slightly different opcode
- * layout. The destination instruction ID (IADDR) overlaps a source field.
- * Instruction ID's seem to be numbered based on the UPLOAD_FROM_ID FIFO
- * command, and is incremented automatically on each UPLOAD_INST FIFO
- * command.
- *
- * Conditional branching is achieved by using the condition tests described
- * above. There doesn't appear to be dedicated looping instructions, but
- * this can be done using a temp reg + conditional branching.
- *
- * Subroutines may be uploaded before the main program itself, but the first
- * executed instruction is determined by the PROGRAM_START_ID FIFO command.
- *
- */
-
-/* DWORD 0 */
-
-/* guess that this is the same as nv40 */
-#define NV30_VP_INST_INDEX_INPUT (1 << 27)
-
-#define NV30_VP_INST_ADDR_REG_SELECT_1 (1 << 24)
-#define NV30_VP_INST_SRC2_ABS (1 << 23) /* guess */
-#define NV30_VP_INST_SRC1_ABS (1 << 22) /* guess */
-#define NV30_VP_INST_SRC0_ABS (1 << 21) /* guess */
-#define NV30_VP_INST_VEC_RESULT (1 << 20)
-#define NV30_VP_INST_DEST_TEMP_ID_SHIFT 16
-#define NV30_VP_INST_DEST_TEMP_ID_MASK (0x0F << 16)
-#define NV30_VP_INST_COND_UPDATE_ENABLE (1<<15)
-#define NV30_VP_INST_VEC_DEST_TEMP_MASK (0x1F << 16)
-#define NV30_VP_INST_COND_TEST_ENABLE (1<<14)
-#define NV30_VP_INST_COND_SHIFT 11
-#define NV30_VP_INST_COND_MASK (0x07 << 11)
-#define NV30_VP_INST_COND_SWZ_X_SHIFT 9
-#define NV30_VP_INST_COND_SWZ_X_MASK (0x03 << 9)
-#define NV30_VP_INST_COND_SWZ_Y_SHIFT 7
-#define NV30_VP_INST_COND_SWZ_Y_MASK (0x03 << 7)
-#define NV30_VP_INST_COND_SWZ_Z_SHIFT 5
-#define NV30_VP_INST_COND_SWZ_Z_MASK (0x03 << 5)
-#define NV30_VP_INST_COND_SWZ_W_SHIFT 3
-#define NV30_VP_INST_COND_SWZ_W_MASK (0x03 << 3)
-#define NV30_VP_INST_COND_SWZ_ALL_SHIFT 3
-#define NV30_VP_INST_COND_SWZ_ALL_MASK (0xFF << 3)
-#define NV30_VP_INST_ADDR_SWZ_SHIFT 1
-#define NV30_VP_INST_ADDR_SWZ_MASK (0x03 << 1)
-#define NV30_VP_INST_SCA_OPCODEH_SHIFT 0
-#define NV30_VP_INST_SCA_OPCODEH_MASK (0x01 << 0)
-
-/* DWORD 1 */
-#define NV30_VP_INST_SCA_OPCODEL_SHIFT 28
-#define NV30_VP_INST_SCA_OPCODEL_MASK (0x0F << 28)
-#define NV30_VP_INST_VEC_OPCODE_SHIFT 23
-#define NV30_VP_INST_VEC_OPCODE_MASK (0x1F << 23)
-#define NV30_VP_INST_CONST_SRC_SHIFT 14
-#define NV30_VP_INST_CONST_SRC_MASK (0xFF << 14)
-#define NV30_VP_INST_INPUT_SRC_SHIFT 9 /*NV20*/
-#define NV30_VP_INST_INPUT_SRC_MASK (0x0F << 9) /*NV20*/
-#define NV30_VP_INST_SRC0H_SHIFT 0 /*NV20*/
-#define NV30_VP_INST_SRC0H_MASK (0x1FF << 0) /*NV20*/
-
-/* Please note: the IADDR fields overlap other fields because they are used
- * only for branch instructions. See Branching: label above
- *
- * DWORD 2
- */
-#define NV30_VP_INST_SRC0L_SHIFT 26 /*NV20*/
-#define NV30_VP_INST_SRC0L_MASK (0x3F <<26) /* NV30_VP_SRC0_LOW_MASK << 26 */
-#define NV30_VP_INST_SRC1_SHIFT 11 /*NV20*/
-#define NV30_VP_INST_SRC1_MASK (0x7FFF<<11) /*NV20*/
-#define NV30_VP_INST_SRC2H_SHIFT 0 /*NV20*/
-#define NV30_VP_INST_SRC2H_MASK (0x7FF << 0) /* NV30_VP_SRC2_HIGH_MASK >> 4*/
-#define NV30_VP_INST_IADDR_SHIFT 2
-#define NV30_VP_INST_IADDR_MASK (0x1FF << 2) /* NV30_VP_SRC2_LOW_MASK << 28 */
-
-/* DWORD 3 */
-#define NV30_VP_INST_SRC2L_SHIFT 28 /*NV20*/
-#define NV30_VP_INST_SRC2L_MASK (0x0F <<28) /*NV20*/
-#define NV30_VP_INST_STEMP_WRITEMASK_SHIFT 24
-#define NV30_VP_INST_STEMP_WRITEMASK_MASK (0x0F << 24)
-#define NV30_VP_INST_VTEMP_WRITEMASK_SHIFT 20
-#define NV30_VP_INST_VTEMP_WRITEMASK_MASK (0x0F << 20)
-#define NV30_VP_INST_SDEST_WRITEMASK_SHIFT 16
-#define NV30_VP_INST_SDEST_WRITEMASK_MASK (0x0F << 16)
-#define NV30_VP_INST_VDEST_WRITEMASK_SHIFT 12 /*NV20*/
-#define NV30_VP_INST_VDEST_WRITEMASK_MASK (0x0F << 12) /*NV20*/
-#define NV30_VP_INST_DEST_SHIFT 2
-#define NV30_VP_INST_DEST_MASK (0x1F << 2)
-# define NV30_VP_INST_DEST_POS 0
-# define NV30_VP_INST_DEST_BFC0 1
-# define NV30_VP_INST_DEST_BFC1 2
-# define NV30_VP_INST_DEST_COL0 3
-# define NV30_VP_INST_DEST_COL1 4
-# define NV30_VP_INST_DEST_FOGC 5
-# define NV30_VP_INST_DEST_PSZ 6
-# define NV30_VP_INST_DEST_TC(n) (8+(n))
-# define NV30_VP_INST_DEST_CLP(n) (17 + (n))
-
-/* guess that this is the same as nv40 */
-#define NV30_VP_INST_INDEX_CONST (1 << 1)
-
-/* Useful to split the source selection regs into their pieces */
-#define NV30_VP_SRC0_HIGH_SHIFT 6
-#define NV30_VP_SRC0_HIGH_MASK 0x00007FC0
-#define NV30_VP_SRC0_LOW_MASK 0x0000003F
-#define NV30_VP_SRC2_HIGH_SHIFT 4
-#define NV30_VP_SRC2_HIGH_MASK 0x00007FF0
-#define NV30_VP_SRC2_LOW_MASK 0x0000000F
-
-
-/* Source-register definition - matches NV20 exactly */
-#define NV30_VP_SRC_NEGATE (1<<14)
-#define NV30_VP_SRC_SWZ_X_SHIFT 12
-#define NV30_VP_SRC_REG_SWZ_X_MASK (0x03 <<12)
-#define NV30_VP_SRC_SWZ_Y_SHIFT 10
-#define NV30_VP_SRC_REG_SWZ_Y_MASK (0x03 <<10)
-#define NV30_VP_SRC_SWZ_Z_SHIFT 8
-#define NV30_VP_SRC_REG_SWZ_Z_MASK (0x03 << 8)
-#define NV30_VP_SRC_SWZ_W_SHIFT 6
-#define NV30_VP_SRC_REG_SWZ_W_MASK (0x03 << 6)
-#define NV30_VP_SRC_REG_SWZ_ALL_SHIFT 6
-#define NV30_VP_SRC_REG_SWZ_ALL_MASK (0xFF << 6)
-#define NV30_VP_SRC_TEMP_SRC_SHIFT 2
-#define NV30_VP_SRC_REG_TEMP_ID_MASK (0x0F << 0)
-#define NV30_VP_SRC_REG_TYPE_SHIFT 0
-#define NV30_VP_SRC_REG_TYPE_MASK (0x03 << 0)
-#define NV30_VP_SRC_REG_TYPE_TEMP 1
-#define NV30_VP_SRC_REG_TYPE_INPUT 2
-#define NV30_VP_SRC_REG_TYPE_CONST 3 /* guess */
-
-#include "nvfx_shader.h"
-
-#endif
+++ /dev/null
-#include "util/u_format.h"
-#include "nvfx_context.h"
-#include "nvfx_tex.h"
-#include "nvfx_resource.h"
-
-void
-nv40_sampler_state_init(struct pipe_context *pipe,
- struct nvfx_sampler_state *ps,
- const struct pipe_sampler_state *cso)
-{
- if (cso->max_anisotropy >= 2) {
- /* no idea, binary driver sets it, works without it.. meh.. */
- ps->wrap |= (1 << 5);
-
- if (cso->max_anisotropy >= 16)
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_16X;
- else if (cso->max_anisotropy >= 12)
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_12X;
- else if (cso->max_anisotropy >= 10)
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_10X;
- else if (cso->max_anisotropy >= 8)
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_8X;
- else if (cso->max_anisotropy >= 6)
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_6X;
- else if (cso->max_anisotropy >= 4)
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_4X;
- else
- ps->en |= NV40_3D_TEX_ENABLE_ANISO_2X;
- }
-
- ps->filt |= (int)(cso->lod_bias * 256.0) & 0x1fff;
-
- ps->max_lod = (int)(CLAMP(cso->max_lod, 0.0, 15.0 + (255.0 / 256.0)) * 256.0);
- ps->min_lod = (int)(CLAMP(cso->min_lod, 0.0, 15.0 + (255.0 / 256.0)) * 256.0);
-
- ps->en |= NV40_3D_TEX_ENABLE_ENABLE;
-}
-
-void
-nv40_sampler_view_init(struct pipe_context *pipe,
- struct nvfx_sampler_view *sv)
-{
- struct pipe_resource* pt = sv->base.texture;
- struct nvfx_miptree* mt = (struct nvfx_miptree*)pt;
- struct nvfx_texture_format *tf = &nvfx_texture_formats[sv->base.format];
- unsigned txf;
- unsigned level = pt->target == PIPE_TEXTURE_CUBE ? 0 : sv->base.u.tex.first_level;
- assert(tf->fmt[4] >= 0);
-
- txf = sv->u.init_fmt;
- txf |= 0x8000;
- if(pt->target == PIPE_TEXTURE_CUBE)
- txf |= ((pt->last_level + 1) << NV40_3D_TEX_FORMAT_MIPMAP_COUNT__SHIFT);
- else
- txf |= (((sv->base.u.tex.last_level - sv->base.u.tex.first_level) + 1) << NV40_3D_TEX_FORMAT_MIPMAP_COUNT__SHIFT);
-
- if (!mt->linear_pitch)
- sv->u.nv40.npot_size2 = 0;
- else {
- sv->u.nv40.npot_size2 = mt->linear_pitch;
- txf |= NV40_3D_TEX_FORMAT_LINEAR;
- }
-
- sv->u.nv40.fmt[0] = tf->fmt[4] | txf;
- sv->u.nv40.fmt[1] = tf->fmt[5] | txf;
-
- sv->u.nv40.npot_size2 |= (u_minify(pt->depth0, level) << NV40_3D_TEX_SIZE1_DEPTH__SHIFT);
-
- sv->lod_offset = (sv->base.u.tex.first_level - level) * 256;
- sv->max_lod_limit = (sv->base.u.tex.last_level - level) * 256;
-}
-
-void
-nv40_fragtex_set(struct nvfx_context *nvfx, int unit)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct nvfx_sampler_state *ps = nvfx->tex_sampler[unit];
- struct nvfx_sampler_view* sv = (struct nvfx_sampler_view*)nvfx->fragment_sampler_views[unit];
- struct nouveau_bo *bo = ((struct nvfx_miptree *)sv->base.texture)->base.bo;
- unsigned tex_flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_RD;
- unsigned txf;
- unsigned max_lod = MIN2(ps->max_lod + sv->lod_offset, sv->max_lod_limit);
- unsigned min_lod = MIN2(ps->min_lod + sv->lod_offset, max_lod);
-
- txf = sv->u.nv40.fmt[ps->compare] | ps->fmt;
-
- MARK_RING(chan, 11, 2);
- BEGIN_RING(chan, eng3d, NV30_3D_TEX_OFFSET(unit), 8);
- OUT_RELOC(chan, bo, sv->offset, tex_flags | NOUVEAU_BO_LOW, 0, 0);
- OUT_RELOC(chan, bo, txf, tex_flags | NOUVEAU_BO_OR,
- NV30_3D_TEX_FORMAT_DMA0, NV30_3D_TEX_FORMAT_DMA1);
- OUT_RING(chan, (ps->wrap & sv->wrap_mask) | sv->wrap);
- OUT_RING(chan, ps->en | (min_lod << 19) | (max_lod << 7));
- OUT_RING(chan, sv->swizzle);
- OUT_RING(chan, ps->filt | sv->filt);
- OUT_RING(chan, sv->npot_size);
- OUT_RING(chan, ps->bcol);
- BEGIN_RING(chan, eng3d, NV40_3D_TEX_SIZE1(unit), 1);
- OUT_RING(chan, sv->u.nv40.npot_size2);
-
- nvfx->hw_txf[unit] = txf;
- nvfx->hw_samplers |= (1 << unit);
-}
+++ /dev/null
-#ifndef __NV40_SHADER_H__
-#define __NV40_SHADER_H__
-
-/* Vertex programs instruction set
- *
- * The NV40 instruction set is very similar to NV30. Most fields are in
- * a slightly different position in the instruction however.
- *
- * Merged instructions
- * In some cases it is possible to put two instructions into one opcode
- * slot. The rules for when this is OK is not entirely clear to me yet.
- *
- * There are separate writemasks and dest temp register fields for each
- * grouping of instructions. There is however only one field with the
- * ID of a result register. Writing to temp/result regs is selected by
- * setting VEC_RESULT/SCA_RESULT.
- *
- * Temporary registers
- * The source/dest temp register fields have been extended by 1 bit, to
- * give a total of 32 temporary registers.
- *
- * Relative Addressing
- * NV40 can use an address register to index into vertex attribute regs.
- * This is done by putting the offset value into INPUT_SRC and setting
- * the INDEX_INPUT flag.
- *
- * Conditional execution (see NV_vertex_program{2,3} for details)
- * There is a second condition code register on NV40, it's use is enabled
- * by setting the COND_REG_SELECT_1 flag.
- *
- * Texture lookup
- * TODO
- */
-
-/* ---- OPCODE BITS 127:96 / data DWORD 0 --- */
-#define NV40_VP_INST_VEC_RESULT (1 << 30)
-/* uncertain.. */
-#define NV40_VP_INST_COND_UPDATE_ENABLE ((1 << 14)|1<<29)
-/* use address reg as index into attribs */
-#define NV40_VP_INST_INDEX_INPUT (1 << 27)
-#define NV40_VP_INST_SATURATE (1 << 26)
-#define NV40_VP_INST_COND_REG_SELECT_1 (1 << 25)
-#define NV40_VP_INST_ADDR_REG_SELECT_1 (1 << 24)
-#define NV40_VP_INST_SRC2_ABS (1 << 23)
-#define NV40_VP_INST_SRC1_ABS (1 << 22)
-#define NV40_VP_INST_SRC0_ABS (1 << 21)
-#define NV40_VP_INST_VEC_DEST_TEMP_SHIFT 15
-#define NV40_VP_INST_VEC_DEST_TEMP_MASK (0x3F << 15)
-#define NV40_VP_INST_COND_TEST_ENABLE (1 << 13)
-#define NV40_VP_INST_COND_SHIFT 10
-#define NV40_VP_INST_COND_MASK (0x7 << 10)
-#define NV40_VP_INST_COND_SWZ_X_SHIFT 8
-#define NV40_VP_INST_COND_SWZ_X_MASK (3 << 8)
-#define NV40_VP_INST_COND_SWZ_Y_SHIFT 6
-#define NV40_VP_INST_COND_SWZ_Y_MASK (3 << 6)
-#define NV40_VP_INST_COND_SWZ_Z_SHIFT 4
-#define NV40_VP_INST_COND_SWZ_Z_MASK (3 << 4)
-#define NV40_VP_INST_COND_SWZ_W_SHIFT 2
-#define NV40_VP_INST_COND_SWZ_W_MASK (3 << 2)
-#define NV40_VP_INST_COND_SWZ_ALL_SHIFT 2
-#define NV40_VP_INST_COND_SWZ_ALL_MASK (0xFF << 2)
-#define NV40_VP_INST_ADDR_SWZ_SHIFT 0
-#define NV40_VP_INST_ADDR_SWZ_MASK (0x03 << 0)
-#define NV40_VP_INST0_KNOWN ( \
- NV40_VP_INST_INDEX_INPUT | \
- NV40_VP_INST_COND_REG_SELECT_1 | \
- NV40_VP_INST_ADDR_REG_SELECT_1 | \
- NV40_VP_INST_SRC2_ABS | \
- NV40_VP_INST_SRC1_ABS | \
- NV40_VP_INST_SRC0_ABS | \
- NV40_VP_INST_VEC_DEST_TEMP_MASK | \
- NV40_VP_INST_COND_TEST_ENABLE | \
- NV40_VP_INST_COND_MASK | \
- NV40_VP_INST_COND_SWZ_ALL_MASK | \
- NV40_VP_INST_ADDR_SWZ_MASK)
-
-/* ---- OPCODE BITS 95:64 / data DWORD 1 --- */
-#define NV40_VP_INST_VEC_OPCODE_SHIFT 22
-#define NV40_VP_INST_VEC_OPCODE_MASK (0x1F << 22)
-#define NV40_VP_INST_SCA_OPCODE_SHIFT 27
-#define NV40_VP_INST_SCA_OPCODE_MASK (0x1F << 27)
-#define NV40_VP_INST_CONST_SRC_SHIFT 12
-#define NV40_VP_INST_CONST_SRC_MASK (0xFF << 12)
-#define NV40_VP_INST_INPUT_SRC_SHIFT 8
-#define NV40_VP_INST_INPUT_SRC_MASK (0x0F << 8)
-#define NV40_VP_INST_SRC0H_SHIFT 0
-#define NV40_VP_INST_SRC0H_MASK (0xFF << 0)
-#define NV40_VP_INST1_KNOWN ( \
- NV40_VP_INST_VEC_OPCODE_MASK | \
- NV40_VP_INST_SCA_OPCODE_MASK | \
- NV40_VP_INST_CONST_SRC_MASK | \
- NV40_VP_INST_INPUT_SRC_MASK | \
- NV40_VP_INST_SRC0H_MASK \
- )
-
-/* ---- OPCODE BITS 63:32 / data DWORD 2 --- */
-#define NV40_VP_INST_SRC0L_SHIFT 23
-#define NV40_VP_INST_SRC0L_MASK (0x1FF << 23)
-#define NV40_VP_INST_SRC1_SHIFT 6
-#define NV40_VP_INST_SRC1_MASK (0x1FFFF << 6)
-#define NV40_VP_INST_SRC2H_SHIFT 0
-#define NV40_VP_INST_SRC2H_MASK (0x3F << 0)
-#define NV40_VP_INST_IADDRH_SHIFT 0
-#define NV40_VP_INST_IADDRH_MASK (0x3F << 0)
-
-/* ---- OPCODE BITS 31:0 / data DWORD 3 --- */
-#define NV40_VP_INST_IADDRL_SHIFT 29
-#define NV40_VP_INST_IADDRL_MASK (7 << 29)
-#define NV40_VP_INST_SRC2L_SHIFT 21
-#define NV40_VP_INST_SRC2L_MASK (0x7FF << 21)
-#define NV40_VP_INST_SCA_WRITEMASK_SHIFT 17
-#define NV40_VP_INST_SCA_WRITEMASK_MASK (0xF << 17)
-# define NV40_VP_INST_SCA_WRITEMASK_X (1 << 20)
-# define NV40_VP_INST_SCA_WRITEMASK_Y (1 << 19)
-# define NV40_VP_INST_SCA_WRITEMASK_Z (1 << 18)
-# define NV40_VP_INST_SCA_WRITEMASK_W (1 << 17)
-#define NV40_VP_INST_VEC_WRITEMASK_SHIFT 13
-#define NV40_VP_INST_VEC_WRITEMASK_MASK (0xF << 13)
-# define NV40_VP_INST_VEC_WRITEMASK_X (1 << 16)
-# define NV40_VP_INST_VEC_WRITEMASK_Y (1 << 15)
-# define NV40_VP_INST_VEC_WRITEMASK_Z (1 << 14)
-# define NV40_VP_INST_VEC_WRITEMASK_W (1 << 13)
-#define NV40_VP_INST_SCA_RESULT (1 << 12)
-#define NV40_VP_INST_SCA_DEST_TEMP_SHIFT 7
-#define NV40_VP_INST_SCA_DEST_TEMP_MASK (0x1F << 7)
-#define NV40_VP_INST_DEST_SHIFT 2
-#define NV40_VP_INST_DEST_MASK (31 << 2)
-# define NV40_VP_INST_DEST_POS 0
-# define NV40_VP_INST_DEST_COL0 1
-# define NV40_VP_INST_DEST_COL1 2
-# define NV40_VP_INST_DEST_BFC0 3
-# define NV40_VP_INST_DEST_BFC1 4
-# define NV40_VP_INST_DEST_FOGC 5
-# define NV40_VP_INST_DEST_PSZ 6
-# define NV40_VP_INST_DEST_TC0 7
-# define NV40_VP_INST_DEST_TC(n) (7+n)
-# define NV40_VP_INST_DEST_TEMP 0x1F
-#define NV40_VP_INST_INDEX_CONST (1 << 1)
-#define NV40_VP_INST3_KNOWN ( \
- NV40_VP_INST_SRC2L_MASK |\
- NV40_VP_INST_SCA_WRITEMASK_MASK |\
- NV40_VP_INST_VEC_WRITEMASK_MASK |\
- NV40_VP_INST_SCA_DEST_TEMP_MASK |\
- NV40_VP_INST_DEST_MASK |\
- NV40_VP_INST_INDEX_CONST)
-
-/* Useful to split the source selection regs into their pieces */
-#define NV40_VP_SRC0_HIGH_SHIFT 9
-#define NV40_VP_SRC0_HIGH_MASK 0x0001FE00
-#define NV40_VP_SRC0_LOW_MASK 0x000001FF
-#define NV40_VP_SRC2_HIGH_SHIFT 11
-#define NV40_VP_SRC2_HIGH_MASK 0x0001F800
-#define NV40_VP_SRC2_LOW_MASK 0x000007FF
-
-/* Source selection - these are the bits you fill NV40_VP_INST_SRCn with */
-#define NV40_VP_SRC_NEGATE (1 << 16)
-#define NV40_VP_SRC_SWZ_X_SHIFT 14
-#define NV40_VP_SRC_SWZ_X_MASK (3 << 14)
-#define NV40_VP_SRC_SWZ_Y_SHIFT 12
-#define NV40_VP_SRC_SWZ_Y_MASK (3 << 12)
-#define NV40_VP_SRC_SWZ_Z_SHIFT 10
-#define NV40_VP_SRC_SWZ_Z_MASK (3 << 10)
-#define NV40_VP_SRC_SWZ_W_SHIFT 8
-#define NV40_VP_SRC_SWZ_W_MASK (3 << 8)
-#define NV40_VP_SRC_SWZ_ALL_SHIFT 8
-#define NV40_VP_SRC_SWZ_ALL_MASK (0xFF << 8)
-#define NV40_VP_SRC_TEMP_SRC_SHIFT 2
-#define NV40_VP_SRC_TEMP_SRC_MASK (0x1F << 2)
-#define NV40_VP_SRC_REG_TYPE_SHIFT 0
-#define NV40_VP_SRC_REG_TYPE_MASK (3 << 0)
-# define NV40_VP_SRC_REG_TYPE_UNK0 0
-# define NV40_VP_SRC_REG_TYPE_TEMP 1
-# define NV40_VP_SRC_REG_TYPE_INPUT 2
-# define NV40_VP_SRC_REG_TYPE_CONST 3
-
-#include "nvfx_shader.h"
-
-#endif
+++ /dev/null
-
-#include "util/u_inlines.h"
-#include "util/u_memory.h"
-#include "util/u_math.h"
-
-#include "nouveau/nouveau_screen.h"
-#include "nouveau/nouveau_winsys.h"
-#include "nvfx_resource.h"
-#include "nvfx_screen.h"
-
-void nvfx_buffer_destroy(struct pipe_screen *pscreen,
- struct pipe_resource *presource)
-{
- struct nvfx_buffer *buffer = nvfx_buffer(presource);
-
- if(!(buffer->base.base.flags & NVFX_RESOURCE_FLAG_USER))
- align_free(buffer->data);
- nouveau_screen_bo_release(pscreen, buffer->base.bo);
- FREE(buffer);
-}
-
-struct pipe_resource *
-nvfx_buffer_create(struct pipe_screen *pscreen,
- const struct pipe_resource *template)
-{
- struct nvfx_screen* screen = nvfx_screen(pscreen);
- struct nvfx_buffer* buffer;
-
- buffer = CALLOC_STRUCT(nvfx_buffer);
- if (!buffer)
- return NULL;
-
- buffer->base.base = *template;
- buffer->base.base.flags |= NOUVEAU_RESOURCE_FLAG_LINEAR;
- pipe_reference_init(&buffer->base.base.reference, 1);
- buffer->base.base.screen = pscreen;
- buffer->size = util_format_get_stride(template->format, template->width0);
- buffer->bytes_to_draw_until_static = buffer->size * screen->static_reuse_threshold;
- buffer->data = align_malloc(buffer->size, 16);
-
- return &buffer->base.base;
-}
-
-
-struct pipe_resource *
-nvfx_user_buffer_create(struct pipe_screen *pscreen,
- void *ptr,
- unsigned bytes,
- unsigned usage)
-{
- struct nvfx_screen* screen = nvfx_screen(pscreen);
- struct nvfx_buffer* buffer;
-
- buffer = CALLOC_STRUCT(nvfx_buffer);
- if (!buffer)
- return NULL;
-
- pipe_reference_init(&buffer->base.base.reference, 1);
- buffer->base.base.flags =
- NOUVEAU_RESOURCE_FLAG_LINEAR | NVFX_RESOURCE_FLAG_USER;
- buffer->base.base.screen = pscreen;
- buffer->base.base.format = PIPE_FORMAT_R8_UNORM;
- buffer->base.base.usage = PIPE_USAGE_IMMUTABLE;
- buffer->base.base.bind = usage;
- buffer->base.base.width0 = bytes;
- buffer->base.base.height0 = 1;
- buffer->base.base.depth0 = 1;
- buffer->base.base.array_size = 1;
- buffer->data = ptr;
- buffer->size = bytes;
- buffer->bytes_to_draw_until_static = bytes * screen->static_reuse_threshold;
- buffer->dirty_end = bytes;
-
- return &buffer->base.base;
-}
-
-void nvfx_buffer_upload(struct nvfx_buffer* buffer)
-{
- unsigned dirty = buffer->dirty_end - buffer->dirty_begin;
- if(!buffer->base.bo)
- {
- buffer->base.bo = nouveau_screen_bo_new(buffer->base.base.screen,
- 16,
- buffer->base.base.usage,
- buffer->base.base.bind,
- buffer->base.base.width0);
- }
-
- if(dirty)
- {
- // TODO: may want to use a temporary in some cases
- nouveau_bo_map(buffer->base.bo, NOUVEAU_BO_WR
- | (buffer->dirty_unsynchronized ? NOUVEAU_BO_NOSYNC : 0));
- memcpy((uint8_t*)buffer->base.bo->map + buffer->dirty_begin, buffer->data + buffer->dirty_begin, dirty);
- nouveau_bo_unmap(buffer->base.bo);
- buffer->dirty_begin = buffer->dirty_end = 0;
- }
-}
+++ /dev/null
-#include "pipe/p_context.h"
-#include "pipe/p_defines.h"
-#include "pipe/p_state.h"
-#include "util/u_clear.h"
-
-#include "nvfx_context.h"
-
-void
-nvfx_clear(struct pipe_context *pipe, unsigned buffers,
- const union pipe_color_union *color, double depth, unsigned stencil)
-{
- util_clear(pipe, &nvfx_context(pipe)->framebuffer, buffers, color, depth,
- stencil);
-}
+++ /dev/null
-#include "draw/draw_context.h"
-#include "pipe/p_defines.h"
-#include "util/u_framebuffer.h"
-#include "vl/vl_decoder.h"
-#include "vl/vl_video_buffer.h"
-
-#include "nvfx_context.h"
-#include "nvfx_screen.h"
-#include "nvfx_resource.h"
-
-static void
-nvfx_flush(struct pipe_context *pipe,
- struct pipe_fence_handle **fence)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_screen *screen = nvfx->screen;
- struct nouveau_channel *chan = screen->base.channel;
- /*struct nouveau_grobj *eng3d = screen->eng3d;*/
-
- /* XXX: we need to actually be intelligent here */
- /* XXX This flag wasn't set by the state tracker anyway. */
- /*if (flags & PIPE_FLUSH_TEXTURE_CACHE) {
- BEGIN_RING(chan, eng3d, 0x1fd8, 1);
- OUT_RING(chan, 2);
- BEGIN_RING(chan, eng3d, 0x1fd8, 1);
- OUT_RING(chan, 1);
- }*/
-
- if (fence) {
- /* horrific hack to make glFinish() work in the absence of
- * having proper fences in nvfx. a pending rewrite will
- * fix this properly, but may be a while off.
- */
- MARK_RING(chan, 1, 1);
- OUT_RELOC(chan, screen->fence, 0, NOUVEAU_BO_WR |
- NOUVEAU_BO_DUMMY, 0, 0);
- FIRE_RING(chan);
- nouveau_bo_map(screen->fence, NOUVEAU_BO_RDWR);
- nouveau_bo_unmap(screen->fence);
- *fence = NULL;
- } else {
- FIRE_RING(chan);
- }
-}
-
-static void
-nvfx_destroy(struct pipe_context *pipe)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- if(nvfx->dummy_fs)
- pipe->delete_fs_state(pipe, nvfx->dummy_fs);
-
- for(unsigned i = 0; i < nvfx->vtxbuf_nr; ++i)
- pipe_resource_reference(&nvfx->vtxbuf[i].buffer, 0);
- pipe_resource_reference(&nvfx->idxbuf.buffer, 0);
- util_unreference_framebuffer_state(&nvfx->framebuffer);
- for(unsigned i = 0; i < PIPE_MAX_SAMPLERS; ++i)
- pipe_sampler_view_reference(&nvfx->fragment_sampler_views[i], 0);
-
- if (nvfx->draw)
- draw_destroy(nvfx->draw);
-
- if(nvfx->screen->cur_ctx == nvfx)
- nvfx->screen->cur_ctx = NULL;
-
- FREE(nvfx);
-}
-
-struct pipe_context *
-nvfx_create(struct pipe_screen *pscreen, void *priv)
-{
- struct nvfx_screen *screen = nvfx_screen(pscreen);
- struct nvfx_context *nvfx;
-
- nvfx = CALLOC(1, sizeof(struct nvfx_context));
- if (!nvfx)
- return NULL;
- nvfx->screen = screen;
-
- nvfx->pipe.screen = pscreen;
- nvfx->pipe.priv = priv;
- nvfx->pipe.destroy = nvfx_destroy;
- nvfx->pipe.draw_vbo = nvfx_draw_vbo;
- nvfx->pipe.clear = nvfx_clear;
- nvfx->pipe.flush = nvfx_flush;
-
- nvfx->is_nv4x = screen->is_nv4x;
- nvfx->use_nv4x = screen->use_nv4x;
- /* TODO: it seems that nv30 might have fixed function clipping usable with vertex programs
- * However, my code for that doesn't work, so use vp clipping for all cards, which works.
- */
- nvfx->use_vp_clipping = TRUE;
-
- nvfx_init_query_functions(nvfx);
- nvfx_init_surface_functions(nvfx);
- nvfx_init_state_functions(nvfx);
- nvfx_init_sampling_functions(nvfx);
- nvfx_init_vbo_functions(nvfx);
- nvfx_init_fragprog_functions(nvfx);
- nvfx_init_vertprog_functions(nvfx);
- nvfx_init_resource_functions(&nvfx->pipe);
- nvfx_init_transfer_functions(&nvfx->pipe);
-
- /* Create, configure, and install fallback swtnl path */
- nvfx->draw = draw_create(&nvfx->pipe);
- draw_wide_point_threshold(nvfx->draw, 9999999.0);
- draw_wide_line_threshold(nvfx->draw, 9999999.0);
- draw_enable_line_stipple(nvfx->draw, FALSE);
- draw_enable_point_sprites(nvfx->draw, FALSE);
- draw_set_rasterize_stage(nvfx->draw, nvfx_draw_render_stage(nvfx));
-
- /* set these to that we init them on first validation */
- nvfx->state.scissor_enabled = ~0;
- nvfx->hw_pointsprite_control = -1;
- nvfx->hw_vp_output = -1;
- nvfx->use_vertex_buffers = -1;
- nvfx->relocs_needed = NVFX_RELOCATE_ALL;
-
- LIST_INITHEAD(&nvfx->render_cache);
- nvfx_context_init_vdec(nvfx);
-
- return &nvfx->pipe;
-}
+++ /dev/null
-#ifndef __NVFX_CONTEXT_H__
-#define __NVFX_CONTEXT_H__
-
-#include <stdio.h>
-
-#include "pipe/p_context.h"
-#include "pipe/p_defines.h"
-#include "pipe/p_state.h"
-#include "pipe/p_compiler.h"
-
-#include "util/u_memory.h"
-#include "util/u_math.h"
-#include "util/u_inlines.h"
-#include "util/u_double_list.h"
-
-#include "draw/draw_vertex.h"
-#include "util/u_blitter.h"
-
-#include "nouveau/nouveau_winsys.h"
-#include "nouveau/nouveau_gldefs.h"
-#include "nouveau/nouveau_resource.h"
-#include "nv30-40_3d.xml.h"
-#include "nvfx_state.h"
-
-#define NOUVEAU_ERR(fmt, args...) \
- fprintf(stderr, "%s:%d - "fmt, __func__, __LINE__, ##args);
-#define NOUVEAU_MSG(fmt, args...) \
- fprintf(stderr, "nouveau: "fmt, ##args);
-
-#include "nvfx_screen.h"
-
-#define NVFX_NEW_BLEND (1 << 0)
-#define NVFX_NEW_RAST (1 << 1)
-#define NVFX_NEW_ZSA (1 << 2)
-#define NVFX_NEW_SAMPLER (1 << 3)
-#define NVFX_NEW_FB (1 << 4)
-#define NVFX_NEW_STIPPLE (1 << 5)
-#define NVFX_NEW_SCISSOR (1 << 6)
-#define NVFX_NEW_VIEWPORT (1 << 7)
-#define NVFX_NEW_BCOL (1 << 8)
-#define NVFX_NEW_VERTPROG (1 << 9)
-#define NVFX_NEW_FRAGPROG (1 << 10)
-#define NVFX_NEW_ARRAYS (1 << 11)
-#define NVFX_NEW_UCP (1 << 12)
-#define NVFX_NEW_SR (1 << 13)
-#define NVFX_NEW_VERTCONST (1 << 14)
-#define NVFX_NEW_FRAGCONST (1 << 15)
-#define NVFX_NEW_INDEX (1 << 16)
-#define NVFX_NEW_SPRITE (1 << 17)
-
-#define NVFX_RELOCATE_FRAMEBUFFER (1 << 0)
-#define NVFX_RELOCATE_FRAGTEX (1 << 1)
-#define NVFX_RELOCATE_FRAGPROG (1 << 2)
-#define NVFX_RELOCATE_VTXBUF (1 << 3)
-#define NVFX_RELOCATE_IDXBUF (1 << 4)
-#define NVFX_RELOCATE_ALL 0x1f
-
-struct nvfx_rasterizer_state {
- struct pipe_rasterizer_state pipe;
- unsigned sb_len;
- uint32_t sb[34];
-};
-
-struct nvfx_zsa_state {
- struct pipe_depth_stencil_alpha_state pipe;
- unsigned sb_len;
- uint32_t sb[24];
-};
-
-struct nvfx_blend_state {
- struct pipe_blend_state pipe;
- unsigned sb_len;
- uint32_t sb[13];
-};
-
-
-struct nvfx_state {
- unsigned scissor_enabled;
- unsigned fp_samplers;
- unsigned render_temps;
-};
-
-struct nvfx_per_vertex_element {
- unsigned idx;
- unsigned vertex_buffer_index;
- unsigned src_offset;
-};
-
-struct nvfx_low_frequency_element {
- unsigned idx;
- unsigned vertex_buffer_index;
- unsigned src_offset;
- void (*fetch_rgba_float)(float *dst, const uint8_t *src, unsigned i, unsigned j);
- unsigned ncomp;
-};
-
-struct nvfx_per_instance_element {
- struct nvfx_low_frequency_element base;
- unsigned instance_divisor;
-};
-
-struct nvfx_per_vertex_buffer_info
-{
- unsigned vertex_buffer_index;
- unsigned per_vertex_size;
-};
-
-struct nvfx_vtxelt_state {
- struct pipe_vertex_element pipe[16];
- unsigned num_elements;
- unsigned vtxfmt[16];
-
- unsigned num_per_vertex_buffer_infos;
- struct nvfx_per_vertex_buffer_info per_vertex_buffer_info[16];
-
- unsigned num_per_vertex;
- struct nvfx_per_vertex_element per_vertex[16];
-
- unsigned num_per_instance;
- struct nvfx_per_instance_element per_instance[16];
-
- unsigned num_constant;
- struct nvfx_low_frequency_element constant[16];
-
- boolean needs_translate;
- struct translate* translate;
-
- unsigned vertex_length;
- unsigned max_vertices_per_packet;
-};
-
-struct nvfx_render_target {
- struct nouveau_bo* bo;
- unsigned offset;
- unsigned pitch;
-};
-
-struct nvfx_context {
- struct pipe_context pipe;
-
- struct nvfx_screen *screen;
-
- unsigned is_nv4x; /* either 0 or ~0 */
- unsigned use_nv4x; /* either 0 or ~0 */
- boolean use_vp_clipping;
-
- struct draw_context *draw;
- /* one is for user-requested operations, the other is for temporary copying inside them */
- struct blitter_context* blitter[2];
- unsigned blitters_in_use;
- struct list_head render_cache;
-
- /* HW state derived from pipe states */
- struct nvfx_state state;
-
- enum {
- HW, SWTNL, SWRAST
- } render_mode;
- unsigned fallback_swtnl;
-
- /* Context state */
- unsigned dirty, draw_dirty;
- struct pipe_scissor_state scissor;
- unsigned stipple[32];
- struct pipe_clip_state clip;
- struct nvfx_pipe_vertex_program *vertprog;
- struct nvfx_pipe_fragment_program *fragprog;
- struct pipe_resource *constbuf[PIPE_SHADER_TYPES];
- unsigned constbuf_nr[PIPE_SHADER_TYPES];
- struct nvfx_rasterizer_state *rasterizer;
- struct nvfx_zsa_state *zsa;
- struct nvfx_blend_state *blend;
- struct pipe_blend_color blend_colour;
- struct pipe_stencil_ref stencil_ref;
- struct pipe_viewport_state viewport;
- struct pipe_framebuffer_state framebuffer;
- struct pipe_index_buffer idxbuf;
- struct nvfx_sampler_state *tex_sampler[PIPE_MAX_SAMPLERS];
- struct pipe_sampler_view *fragment_sampler_views[PIPE_MAX_SAMPLERS];
- struct nvfx_pipe_fragment_program* dummy_fs;
- struct pipe_query* query;
-
- unsigned nr_samplers;
- unsigned nr_textures;
- unsigned dirty_samplers;
- struct pipe_vertex_buffer vtxbuf[PIPE_MAX_ATTRIBS];
- unsigned vtxbuf_nr;
- struct nvfx_vtxelt_state *vtxelt;
- int base_vertex;
- boolean use_index_buffer;
- /* -1 = hardware input setup is outdated
- * 0 = hardware input setup is for inline vertices
- * 1 = hardware input setup is for hardware vertices
- */
- int use_vertex_buffers;
-
- unsigned hw_vtxelt_nr;
- unsigned hw_samplers;
- uint32_t hw_txf[16];
- struct nvfx_render_target hw_rt[4];
- struct nvfx_render_target hw_zeta;
- int hw_pointsprite_control;
- int hw_vp_output;
- struct nvfx_fragment_program* hw_fragprog;
- struct nvfx_vertex_program* hw_vertprog;
-
- unsigned relocs_needed;
-};
-
-static INLINE struct nvfx_context *
-nvfx_context(struct pipe_context *pipe)
-{
- return (struct nvfx_context *)pipe;
-}
-
-extern struct nvfx_state_entry nvfx_state_blend;
-extern struct nvfx_state_entry nvfx_state_blend_colour;
-extern struct nvfx_state_entry nvfx_state_fragprog;
-extern struct nvfx_state_entry nvfx_state_fragtex;
-extern struct nvfx_state_entry nvfx_state_framebuffer;
-extern struct nvfx_state_entry nvfx_state_rasterizer;
-extern struct nvfx_state_entry nvfx_state_scissor;
-extern struct nvfx_state_entry nvfx_state_sr;
-extern struct nvfx_state_entry nvfx_state_stipple;
-extern struct nvfx_state_entry nvfx_state_vbo;
-extern struct nvfx_state_entry nvfx_state_vertprog;
-extern struct nvfx_state_entry nvfx_state_viewport;
-extern struct nvfx_state_entry nvfx_state_vtxfmt;
-extern struct nvfx_state_entry nvfx_state_zsa;
-
-extern void nvfx_init_query_functions(struct nvfx_context *nvfx);
-extern void nvfx_init_surface_functions(struct nvfx_context *nvfx);
-
-/* nvfx_context.c */
-struct pipe_context *
-nvfx_create(struct pipe_screen *pscreen, void *priv);
-
-/* nvfx_clear.c */
-extern void nvfx_clear(struct pipe_context *pipe, unsigned buffers,
- const union pipe_color_union *color,
- double depth, unsigned stencil);
-
-/* nvfx_draw.c */
-extern struct draw_stage *nvfx_draw_render_stage(struct nvfx_context *nvfx);
-extern void nvfx_draw_vbo_swtnl(struct pipe_context *pipe, const struct pipe_draw_info* info);
-extern void nvfx_vtxfmt_validate(struct nvfx_context *nvfx);
-
-/* nvfx_fb.c */
-extern int nvfx_framebuffer_prepare(struct nvfx_context *nvfx);
-extern void nvfx_framebuffer_validate(struct nvfx_context *nvfx);
-void
-nvfx_framebuffer_relocate(struct nvfx_context *nvfx);
-
-/* nvfx_fragprog.c */
-extern void nvfx_fragprog_destroy(struct nvfx_context *,
- struct nvfx_fragment_program *);
-extern void nvfx_fragprog_validate(struct nvfx_context *nvfx);
-extern void nvfx_fragprog_relocate(struct nvfx_context *nvfx);
-extern void nvfx_init_fragprog_functions(struct nvfx_context *nvfx);
-
-/* nvfx_fragtex.c */
-extern void nvfx_init_sampling_functions(struct nvfx_context *nvfx);
-extern void nvfx_fragtex_validate(struct nvfx_context *nvfx);
-extern void nvfx_fragtex_relocate(struct nvfx_context *nvfx);
-
-struct nvfx_sampler_view;
-
-/* nv30_fragtex.c */
-extern void
-nv30_sampler_state_init(struct pipe_context *pipe,
- struct nvfx_sampler_state *ps,
- const struct pipe_sampler_state *cso);
-extern void
-nv30_sampler_view_init(struct pipe_context *pipe,
- struct nvfx_sampler_view *sv);
-extern void nv30_fragtex_set(struct nvfx_context *nvfx, int unit);
-
-/* nv40_fragtex.c */
-extern void
-nv40_sampler_state_init(struct pipe_context *pipe,
- struct nvfx_sampler_state *ps,
- const struct pipe_sampler_state *cso);
-extern void
-nv40_sampler_view_init(struct pipe_context *pipe,
- struct nvfx_sampler_view *sv);
-extern void nv40_fragtex_set(struct nvfx_context *nvfx, int unit);
-
-/* nvfx_state.c */
-extern void nvfx_init_state_functions(struct nvfx_context *nvfx);
-extern void nvfx_state_scissor_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_stipple_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_blend_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_blend_colour_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_viewport_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_rasterizer_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_sr_validate(struct nvfx_context *nvfx);
-extern void nvfx_state_zsa_validate(struct nvfx_context *nvfx);
-
-/* nvfx_state_emit.c */
-extern void nvfx_state_relocate(struct nvfx_context *nvfx, unsigned relocs);
-extern boolean nvfx_state_validate(struct nvfx_context *nvfx);
-extern boolean nvfx_state_validate_swtnl(struct nvfx_context *nvfx);
-
-static inline void
-nvfx_state_emit(struct nvfx_context *nvfx)
-{
- unsigned relocs = NVFX_RELOCATE_FRAMEBUFFER | NVFX_RELOCATE_FRAGTEX | NVFX_RELOCATE_FRAGPROG;
- if (nvfx->render_mode == HW)
- {
- relocs |= NVFX_RELOCATE_VTXBUF;
- if(nvfx->use_index_buffer)
- relocs |= NVFX_RELOCATE_IDXBUF;
- }
-
- relocs &= nvfx->relocs_needed;
- if(relocs)
- nvfx_state_relocate(nvfx, relocs);
-}
-
-/* nvfx_transfer.c */
-extern void nvfx_init_transfer_functions(struct pipe_context *pipe);
-
-/* nvfx_vbo.c */
-extern boolean nvfx_vbo_validate(struct nvfx_context *nvfx);
-extern void nvfx_vbo_swtnl_validate(struct nvfx_context *nvfx);
-extern void nvfx_vbo_relocate(struct nvfx_context *nvfx);
-extern void nvfx_idxbuf_validate(struct nvfx_context* nvfx);
-extern void nvfx_idxbuf_relocate(struct nvfx_context* nvfx);
-extern void nvfx_draw_vbo(struct pipe_context *pipe,
- const struct pipe_draw_info *info);
-extern void nvfx_init_vbo_functions(struct nvfx_context *nvfx);
-extern unsigned nvfx_vertex_formats[];
-
-/* nvfx_vertprog.c */
-extern boolean nvfx_vertprog_validate(struct nvfx_context *nvfx);
-extern void nvfx_vertprog_destroy(struct nvfx_context *,
- struct nvfx_vertex_program *);
-extern void nvfx_init_vertprog_functions(struct nvfx_context *nvfx);
-
-/* nvfx_push.c */
-extern void nvfx_push_vbo(struct pipe_context *pipe, const struct pipe_draw_info *info);
-
-extern void nvfx_context_init_vdec(struct nvfx_context *);
-
-static inline void nvfx_emit_vtx_attr(struct nouveau_channel* chan,
- struct nouveau_grobj *eng3d, unsigned attrib, const float* v,
- unsigned ncomp)
-{
- switch (ncomp) {
- case 4:
- BEGIN_RING(chan, eng3d, NV30_3D_VTX_ATTR_4F_X(attrib), 4);
- OUT_RING(chan, fui(v[0]));
- OUT_RING(chan, fui(v[1]));
- OUT_RING(chan, fui(v[2]));
- OUT_RING(chan, fui(v[3]));
- break;
- case 3:
- BEGIN_RING(chan, eng3d, NV30_3D_VTX_ATTR_3F_X(attrib), 3);
- OUT_RING(chan, fui(v[0]));
- OUT_RING(chan, fui(v[1]));
- OUT_RING(chan, fui(v[2]));
- break;
- case 2:
- BEGIN_RING(chan, eng3d, NV30_3D_VTX_ATTR_2F_X(attrib), 2);
- OUT_RING(chan, fui(v[0]));
- OUT_RING(chan, fui(v[1]));
- break;
- case 1:
- BEGIN_RING(chan, eng3d, NV30_3D_VTX_ATTR_1F(attrib), 1);
- OUT_RING(chan, fui(v[0]));
- break;
- }
-}
-
-#endif
+++ /dev/null
-#include "pipe/p_shader_tokens.h"
-#include "util/u_inlines.h"
-
-#include "util/u_pack_color.h"
-
-#include "draw/draw_context.h"
-#include "draw/draw_vertex.h"
-#include "draw/draw_pipe.h"
-
-#include "nvfx_context.h"
-#include "nvfx_resource.h"
-
-struct nvfx_render_stage {
- struct draw_stage stage;
- struct nvfx_context *nvfx;
- unsigned prim;
-};
-
-static INLINE struct nvfx_render_stage *
-nvfx_render_stage(struct draw_stage *stage)
-{
- return (struct nvfx_render_stage *)stage;
-}
-
-static void
-nvfx_render_flush(struct draw_stage *stage, unsigned flags)
-{
- struct nvfx_render_stage *rs = nvfx_render_stage(stage);
- struct nvfx_context *nvfx = rs->nvfx;
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
-
- if (rs->prim != NV30_3D_VERTEX_BEGIN_END_STOP) {
- BEGIN_RING(chan, eng3d, NV30_3D_VERTEX_BEGIN_END, 1);
- OUT_RING(chan, NV30_3D_VERTEX_BEGIN_END_STOP);
- rs->prim = NV30_3D_VERTEX_BEGIN_END_STOP;
- }
-}
-
-static INLINE void
-nvfx_render_prim(struct draw_stage *stage, struct prim_header *prim,
- unsigned mode, unsigned count)
-{
- struct nvfx_render_stage *rs = nvfx_render_stage(stage);
- struct nvfx_context *nvfx = rs->nvfx;
-
- struct nvfx_screen *screen = nvfx->screen;
- struct nouveau_channel *chan = screen->base.channel;
- struct nouveau_grobj *eng3d = screen->eng3d;
- boolean no_elements = nvfx->vertprog->draw_no_elements;
- unsigned num_attribs = nvfx->vertprog->draw_elements;
-
- /* we need to account the flush as well here even if it is done afterthis
- * function
- */
- if (AVAIL_RING(chan) < ((1 + count * num_attribs * 4) + 6 + 64)) {
- nvfx_render_flush(stage, 0);
- FIRE_RING(chan);
- nvfx_state_emit(nvfx);
-
- assert(AVAIL_RING(chan) >= ((1 + count * num_attribs * 4) + 6 + 64));
- }
-
- /* Switch primitive modes if necessary */
- if (rs->prim != mode) {
- if (rs->prim != NV30_3D_VERTEX_BEGIN_END_STOP) {
- BEGIN_RING(chan, eng3d, NV30_3D_VERTEX_BEGIN_END, 1);
- OUT_RING(chan, NV30_3D_VERTEX_BEGIN_END_STOP);
- }
-
- /* XXX: any command a lot of times seems to (mostly) fix corruption that would otherwise happen */
- /* this seems to cause issues on nv3x, and also be unneeded there */
- if(nvfx->is_nv4x)
- {
- int i;
- for(i = 0; i < 32; ++i)
- {
- BEGIN_RING(chan, eng3d, 0x1dac, 1);
- OUT_RING(chan, 0);
- }
- }
-
- BEGIN_RING(chan, eng3d, NV30_3D_VERTEX_BEGIN_END, 1);
- OUT_RING (chan, mode);
- rs->prim = mode;
- }
-
- if(no_elements) {
- BEGIN_RING_NI(chan, eng3d, NV30_3D_VERTEX_DATA, 4);
- OUT_RING(chan, 0);
- OUT_RING(chan, 0);
- OUT_RING(chan, 0);
- OUT_RING(chan, 0);
- } else {
- BEGIN_RING_NI(chan, eng3d, NV30_3D_VERTEX_DATA, num_attribs * 4 * count);
- for (unsigned i = 0; i < count; ++i)
- {
- struct vertex_header* v = prim->v[i];
- /* TODO: disable divide where it's causing the problem, and remove this hack */
- OUT_RING(chan, fui(v->data[0][0] / v->data[0][3]));
- OUT_RING(chan, fui(v->data[0][1] / v->data[0][3]));
- OUT_RING(chan, fui(v->data[0][2] / v->data[0][3]));
- OUT_RING(chan, fui(1.0f / v->data[0][3]));
- OUT_RINGp(chan, &v->data[1][0], 4 * (num_attribs - 1));
- }
- }
-}
-
-static void
-nvfx_render_point(struct draw_stage *draw, struct prim_header *prim)
-{
- nvfx_render_prim(draw, prim, NV30_3D_VERTEX_BEGIN_END_POINTS, 1);
-}
-
-static void
-nvfx_render_line(struct draw_stage *draw, struct prim_header *prim)
-{
- nvfx_render_prim(draw, prim, NV30_3D_VERTEX_BEGIN_END_LINES, 2);
-}
-
-static void
-nvfx_render_tri(struct draw_stage *draw, struct prim_header *prim)
-{
- nvfx_render_prim(draw, prim, NV30_3D_VERTEX_BEGIN_END_TRIANGLES, 3);
-}
-
-static void
-nvfx_render_reset_stipple_counter(struct draw_stage *draw)
-{
- /* this doesn't really seem to work, but it matters rather little */
- nvfx_render_flush(draw, 0);
-}
-
-static void
-nvfx_render_destroy(struct draw_stage *draw)
-{
- FREE(draw);
-}
-
-struct draw_stage *
-nvfx_draw_render_stage(struct nvfx_context *nvfx)
-{
- struct nvfx_render_stage *render = CALLOC_STRUCT(nvfx_render_stage);
-
- render->nvfx = nvfx;
- render->stage.draw = nvfx->draw;
- render->stage.point = nvfx_render_point;
- render->stage.line = nvfx_render_line;
- render->stage.tri = nvfx_render_tri;
- render->stage.flush = nvfx_render_flush;
- render->stage.reset_stipple_counter = nvfx_render_reset_stipple_counter;
- render->stage.destroy = nvfx_render_destroy;
-
- return &render->stage;
-}
-
-void
-nvfx_draw_vbo_swtnl(struct pipe_context *pipe, const struct pipe_draw_info* info)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- unsigned i;
- void *map;
-
- if (!nvfx_state_validate_swtnl(nvfx))
- return;
-
- nvfx_state_emit(nvfx);
-
- /* these must be passed without adding the offsets */
- for (i = 0; i < nvfx->vtxbuf_nr; i++) {
- map = nvfx_buffer(nvfx->vtxbuf[i].buffer)->data;
- draw_set_mapped_vertex_buffer(nvfx->draw, i, map);
- }
-
- map = NULL;
- if (info->indexed && nvfx->idxbuf.buffer)
- map = nvfx_buffer(nvfx->idxbuf.buffer)->data;
- draw_set_mapped_index_buffer(nvfx->draw, map);
-
- if (nvfx->constbuf[PIPE_SHADER_VERTEX]) {
- const unsigned nr = nvfx->constbuf_nr[PIPE_SHADER_VERTEX];
-
- map = nvfx_buffer(nvfx->constbuf[PIPE_SHADER_VERTEX])->data;
- draw_set_mapped_constant_buffer(nvfx->draw, PIPE_SHADER_VERTEX, 0,
- map, nr);
- }
-
- draw_vbo(nvfx->draw, info);
-
- draw_flush(nvfx->draw);
-}
+++ /dev/null
-#include <float.h>
-#include "pipe/p_context.h"
-#include "pipe/p_defines.h"
-#include "pipe/p_state.h"
-#include "util/u_inlines.h"
-#include "util/u_debug.h"
-
-#include "pipe/p_shader_tokens.h"
-#include "tgsi/tgsi_parse.h"
-#include "tgsi/tgsi_util.h"
-#include "tgsi/tgsi_dump.h"
-#include "tgsi/tgsi_ureg.h"
-
-#include "nvfx_context.h"
-#include "nvfx_shader.h"
-#include "nvfx_resource.h"
-
-struct nvfx_fpc {
- struct nvfx_pipe_fragment_program* pfp;
- struct nvfx_fragment_program *fp;
-
- unsigned max_temps;
- unsigned long long r_temps;
- unsigned long long r_temps_discard;
- struct nvfx_reg r_result[PIPE_MAX_SHADER_OUTPUTS];
- struct nvfx_reg *r_temp;
- unsigned sprite_coord_temp;
-
- int num_regs;
-
- unsigned inst_offset;
- unsigned have_const;
-
- struct util_dynarray imm_data;
-
- struct nvfx_reg* r_imm;
- unsigned nr_imm;
-
- unsigned char generic_to_slot[256]; /* semantic idx for each input semantic */
-
- struct util_dynarray if_stack;
- //struct util_dynarray loop_stack;
- struct util_dynarray label_relocs;
-};
-
-static INLINE struct nvfx_reg
-temp(struct nvfx_fpc *fpc)
-{
- int idx = __builtin_ctzll(~fpc->r_temps);
-
- if (idx >= fpc->max_temps) {
- NOUVEAU_ERR("out of temps!!\n");
- assert(0);
- return nvfx_reg(NVFXSR_TEMP, 0);
- }
-
- fpc->r_temps |= (1ULL << idx);
- fpc->r_temps_discard |= (1ULL << idx);
- return nvfx_reg(NVFXSR_TEMP, idx);
-}
-
-static INLINE void
-release_temps(struct nvfx_fpc *fpc)
-{
- fpc->r_temps &= ~fpc->r_temps_discard;
- fpc->r_temps_discard = 0ULL;
-}
-
-static inline struct nvfx_reg
-nvfx_fp_imm(struct nvfx_fpc *fpc, float a, float b, float c, float d)
-{
- float v[4] = {a, b, c, d};
- int idx = fpc->imm_data.size >> 4;
-
- memcpy(util_dynarray_grow(&fpc->imm_data, sizeof(float) * 4), v, 4 * sizeof(float));
- return nvfx_reg(NVFXSR_IMM, idx);
-}
-
-static void
-grow_insns(struct nvfx_fpc *fpc, int size)
-{
- struct nvfx_fragment_program *fp = fpc->fp;
-
- fp->insn_len += size;
- fp->insn = realloc(fp->insn, sizeof(uint32_t) * fp->insn_len);
-}
-
-static void
-emit_src(struct nvfx_fpc *fpc, int pos, struct nvfx_src src)
-{
- struct nvfx_fragment_program *fp = fpc->fp;
- uint32_t *hw = &fp->insn[fpc->inst_offset];
- uint32_t sr = 0;
-
- switch (src.reg.type) {
- case NVFXSR_INPUT:
- sr |= (NVFX_FP_REG_TYPE_INPUT << NVFX_FP_REG_TYPE_SHIFT);
- hw[0] |= (src.reg.index << NVFX_FP_OP_INPUT_SRC_SHIFT);
- break;
- case NVFXSR_OUTPUT:
- sr |= NVFX_FP_REG_SRC_HALF;
- /* fall-through */
- case NVFXSR_TEMP:
- sr |= (NVFX_FP_REG_TYPE_TEMP << NVFX_FP_REG_TYPE_SHIFT);
- sr |= (src.reg.index << NVFX_FP_REG_SRC_SHIFT);
- break;
- case NVFXSR_RELOCATED:
- sr |= (NVFX_FP_REG_TYPE_TEMP << NVFX_FP_REG_TYPE_SHIFT);
- sr |= (fpc->sprite_coord_temp << NVFX_FP_REG_SRC_SHIFT);
- //printf("adding relocation at %x for %x\n", fpc->inst_offset, src.index);
- util_dynarray_append(&fpc->fp->slot_relocations[src.reg.index], unsigned, fpc->inst_offset + pos + 1);
- break;
- case NVFXSR_IMM:
- if (!fpc->have_const) {
- grow_insns(fpc, 4);
- hw = &fp->insn[fpc->inst_offset];
- fpc->have_const = 1;
- }
-
- memcpy(&fp->insn[fpc->inst_offset + 4],
- (float*)fpc->imm_data.data + src.reg.index * 4,
- sizeof(uint32_t) * 4);
-
- sr |= (NVFX_FP_REG_TYPE_CONST << NVFX_FP_REG_TYPE_SHIFT);
- break;
- case NVFXSR_CONST:
- if (!fpc->have_const) {
- grow_insns(fpc, 4);
- hw = &fp->insn[fpc->inst_offset];
- fpc->have_const = 1;
- }
-
- {
- struct nvfx_fragment_program_data *fpd;
-
- fp->consts = realloc(fp->consts, ++fp->nr_consts *
- sizeof(*fpd));
- fpd = &fp->consts[fp->nr_consts - 1];
- fpd->offset = fpc->inst_offset + 4;
- fpd->index = src.reg.index;
- memset(&fp->insn[fpd->offset], 0, sizeof(uint32_t) * 4);
- }
-
- sr |= (NVFX_FP_REG_TYPE_CONST << NVFX_FP_REG_TYPE_SHIFT);
- break;
- case NVFXSR_NONE:
- sr |= (NVFX_FP_REG_TYPE_INPUT << NVFX_FP_REG_TYPE_SHIFT);
- break;
- default:
- assert(0);
- }
-
- if (src.negate)
- sr |= NVFX_FP_REG_NEGATE;
-
- if (src.abs)
- hw[1] |= (1 << (29 + pos));
-
- sr |= ((src.swz[0] << NVFX_FP_REG_SWZ_X_SHIFT) |
- (src.swz[1] << NVFX_FP_REG_SWZ_Y_SHIFT) |
- (src.swz[2] << NVFX_FP_REG_SWZ_Z_SHIFT) |
- (src.swz[3] << NVFX_FP_REG_SWZ_W_SHIFT));
-
- hw[pos + 1] |= sr;
-}
-
-static void
-emit_dst(struct nvfx_fpc *fpc, struct nvfx_reg dst)
-{
- struct nvfx_fragment_program *fp = fpc->fp;
- uint32_t *hw = &fp->insn[fpc->inst_offset];
-
- switch (dst.type) {
- case NVFXSR_TEMP:
- if (fpc->num_regs < (dst.index + 1))
- fpc->num_regs = dst.index + 1;
- break;
- case NVFXSR_OUTPUT:
- if (dst.index == 1) {
- fp->fp_control |= 0xe;
- } else {
- hw[0] |= NVFX_FP_OP_OUT_REG_HALF;
- }
- break;
- case NVFXSR_NONE:
- hw[0] |= (1 << 30);
- break;
- default:
- assert(0);
- }
-
- hw[0] |= (dst.index << NVFX_FP_OP_OUT_REG_SHIFT);
-}
-
-static void
-nvfx_fp_emit(struct nvfx_fpc *fpc, struct nvfx_insn insn)
-{
- struct nvfx_fragment_program *fp = fpc->fp;
- uint32_t *hw;
-
- fpc->inst_offset = fp->insn_len;
- fpc->have_const = 0;
- grow_insns(fpc, 4);
- hw = &fp->insn[fpc->inst_offset];
- memset(hw, 0, sizeof(uint32_t) * 4);
-
- if (insn.op == NVFX_FP_OP_OPCODE_KIL)
- fp->fp_control |= NV30_3D_FP_CONTROL_USES_KIL;
- hw[0] |= (insn.op << NVFX_FP_OP_OPCODE_SHIFT);
- hw[0] |= (insn.mask << NVFX_FP_OP_OUTMASK_SHIFT);
- hw[2] |= (insn.scale << NVFX_FP_OP_DST_SCALE_SHIFT);
-
- if (insn.sat)
- hw[0] |= NVFX_FP_OP_OUT_SAT;
-
- if (insn.cc_update)
- hw[0] |= NVFX_FP_OP_COND_WRITE_ENABLE;
- hw[1] |= (insn.cc_test << NVFX_FP_OP_COND_SHIFT);
- hw[1] |= ((insn.cc_swz[0] << NVFX_FP_OP_COND_SWZ_X_SHIFT) |
- (insn.cc_swz[1] << NVFX_FP_OP_COND_SWZ_Y_SHIFT) |
- (insn.cc_swz[2] << NVFX_FP_OP_COND_SWZ_Z_SHIFT) |
- (insn.cc_swz[3] << NVFX_FP_OP_COND_SWZ_W_SHIFT));
-
- if(insn.unit >= 0)
- {
- hw[0] |= (insn.unit << NVFX_FP_OP_TEX_UNIT_SHIFT);
- fp->samplers |= (1 << insn.unit);
- }
-
- emit_dst(fpc, insn.dst);
- emit_src(fpc, 0, insn.src[0]);
- emit_src(fpc, 1, insn.src[1]);
- emit_src(fpc, 2, insn.src[2]);
-}
-
-#define arith(s,o,d,m,s0,s1,s2) \
- nvfx_insn((s), NVFX_FP_OP_OPCODE_##o, -1, \
- (d), (m), (s0), (s1), (s2))
-
-#define tex(s,o,u,d,m,s0,s1,s2) \
- nvfx_insn((s), NVFX_FP_OP_OPCODE_##o, (u), \
- (d), (m), (s0), none, none)
-
-/* IF src.x != 0, as TGSI specifies */
-static void
-nv40_fp_if(struct nvfx_fpc *fpc, struct nvfx_src src)
-{
- const struct nvfx_src none = nvfx_src(nvfx_reg(NVFXSR_NONE, 0));
- struct nvfx_insn insn = arith(0, MOV, none.reg, NVFX_FP_MASK_X, src, none, none);
- uint32_t *hw;
- insn.cc_update = 1;
- nvfx_fp_emit(fpc, insn);
-
- fpc->inst_offset = fpc->fp->insn_len;
- grow_insns(fpc, 4);
- hw = &fpc->fp->insn[fpc->inst_offset];
- /* I really wonder why fp16 precision is used. Presumably the hardware ignores it? */
- hw[0] = (NV40_FP_OP_BRA_OPCODE_IF << NVFX_FP_OP_OPCODE_SHIFT) |
- NV40_FP_OP_OUT_NONE |
- (NVFX_FP_PRECISION_FP16 << NVFX_FP_OP_PRECISION_SHIFT);
- /* Use .xxxx swizzle so that we check only src[0].x*/
- hw[1] = (0 << NVFX_FP_OP_COND_SWZ_X_SHIFT) |
- (0 << NVFX_FP_OP_COND_SWZ_Y_SHIFT) |
- (0 << NVFX_FP_OP_COND_SWZ_Z_SHIFT) |
- (0 << NVFX_FP_OP_COND_SWZ_W_SHIFT) |
- (NVFX_FP_OP_COND_NE << NVFX_FP_OP_COND_SHIFT);
- hw[2] = 0; /* | NV40_FP_OP_OPCODE_IS_BRANCH | else_offset */
- hw[3] = 0; /* | endif_offset */
- util_dynarray_append(&fpc->if_stack, unsigned, fpc->inst_offset);
-}
-
-/* IF src.x != 0, as TGSI specifies */
-static void
-nv40_fp_cal(struct nvfx_fpc *fpc, unsigned target)
-{
- struct nvfx_relocation reloc;
- uint32_t *hw;
- fpc->inst_offset = fpc->fp->insn_len;
- grow_insns(fpc, 4);
- hw = &fpc->fp->insn[fpc->inst_offset];
- /* I really wonder why fp16 precision is used. Presumably the hardware ignores it? */
- hw[0] = (NV40_FP_OP_BRA_OPCODE_CAL << NVFX_FP_OP_OPCODE_SHIFT);
- /* Use .xxxx swizzle so that we check only src[0].x*/
- hw[1] = (NVFX_SWZ_IDENTITY << NVFX_FP_OP_COND_SWZ_ALL_SHIFT) |
- (NVFX_FP_OP_COND_TR << NVFX_FP_OP_COND_SHIFT);
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH; /* | call_offset */
- hw[3] = 0;
- reloc.target = target;
- reloc.location = fpc->inst_offset + 2;
- util_dynarray_append(&fpc->label_relocs, struct nvfx_relocation, reloc);
-}
-
-static void
-nv40_fp_ret(struct nvfx_fpc *fpc)
-{
- uint32_t *hw;
- fpc->inst_offset = fpc->fp->insn_len;
- grow_insns(fpc, 4);
- hw = &fpc->fp->insn[fpc->inst_offset];
- /* I really wonder why fp16 precision is used. Presumably the hardware ignores it? */
- hw[0] = (NV40_FP_OP_BRA_OPCODE_RET << NVFX_FP_OP_OPCODE_SHIFT);
- /* Use .xxxx swizzle so that we check only src[0].x*/
- hw[1] = (NVFX_SWZ_IDENTITY << NVFX_FP_OP_COND_SWZ_ALL_SHIFT) |
- (NVFX_FP_OP_COND_TR << NVFX_FP_OP_COND_SHIFT);
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH; /* | call_offset */
- hw[3] = 0;
-}
-
-static void
-nv40_fp_rep(struct nvfx_fpc *fpc, unsigned count, unsigned target)
-{
- struct nvfx_relocation reloc;
- uint32_t *hw;
- fpc->inst_offset = fpc->fp->insn_len;
- grow_insns(fpc, 4);
- hw = &fpc->fp->insn[fpc->inst_offset];
- /* I really wonder why fp16 precision is used. Presumably the hardware ignores it? */
- hw[0] = (NV40_FP_OP_BRA_OPCODE_REP << NVFX_FP_OP_OPCODE_SHIFT) |
- NV40_FP_OP_OUT_NONE |
- (NVFX_FP_PRECISION_FP16 << NVFX_FP_OP_PRECISION_SHIFT);
- /* Use .xxxx swizzle so that we check only src[0].x*/
- hw[1] = (NVFX_SWZ_IDENTITY << NVFX_FP_OP_COND_SWZ_ALL_SHIFT) |
- (NVFX_FP_OP_COND_TR << NVFX_FP_OP_COND_SHIFT);
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH |
- (count << NV40_FP_OP_REP_COUNT1_SHIFT) |
- (count << NV40_FP_OP_REP_COUNT2_SHIFT) |
- (count << NV40_FP_OP_REP_COUNT3_SHIFT);
- hw[3] = 0; /* | end_offset */
- reloc.target = target;
- reloc.location = fpc->inst_offset + 3;
- util_dynarray_append(&fpc->label_relocs, struct nvfx_relocation, reloc);
- //util_dynarray_append(&fpc->loop_stack, unsigned, target);
-}
-
-/* warning: this only works forward, and probably only if not inside any IF */
-static void
-nv40_fp_bra(struct nvfx_fpc *fpc, unsigned target)
-{
- struct nvfx_relocation reloc;
- uint32_t *hw;
- fpc->inst_offset = fpc->fp->insn_len;
- grow_insns(fpc, 4);
- hw = &fpc->fp->insn[fpc->inst_offset];
- /* I really wonder why fp16 precision is used. Presumably the hardware ignores it? */
- hw[0] = (NV40_FP_OP_BRA_OPCODE_IF << NVFX_FP_OP_OPCODE_SHIFT) |
- NV40_FP_OP_OUT_NONE |
- (NVFX_FP_PRECISION_FP16 << NVFX_FP_OP_PRECISION_SHIFT);
- /* Use .xxxx swizzle so that we check only src[0].x*/
- hw[1] = (NVFX_SWZ_IDENTITY << NVFX_FP_OP_COND_SWZ_X_SHIFT) |
- (NVFX_FP_OP_COND_FL << NVFX_FP_OP_COND_SHIFT);
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH; /* | else_offset */
- hw[3] = 0; /* | endif_offset */
- reloc.target = target;
- reloc.location = fpc->inst_offset + 2;
- util_dynarray_append(&fpc->label_relocs, struct nvfx_relocation, reloc);
- reloc.target = target;
- reloc.location = fpc->inst_offset + 3;
- util_dynarray_append(&fpc->label_relocs, struct nvfx_relocation, reloc);
-}
-
-static void
-nv40_fp_brk(struct nvfx_fpc *fpc)
-{
- uint32_t *hw;
- fpc->inst_offset = fpc->fp->insn_len;
- grow_insns(fpc, 4);
- hw = &fpc->fp->insn[fpc->inst_offset];
- /* I really wonder why fp16 precision is used. Presumably the hardware ignores it? */
- hw[0] = (NV40_FP_OP_BRA_OPCODE_BRK << NVFX_FP_OP_OPCODE_SHIFT) |
- NV40_FP_OP_OUT_NONE;
- /* Use .xxxx swizzle so that we check only src[0].x*/
- hw[1] = (NVFX_SWZ_IDENTITY << NVFX_FP_OP_COND_SWZ_X_SHIFT) |
- (NVFX_FP_OP_COND_TR << NVFX_FP_OP_COND_SHIFT);
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH;
- hw[3] = 0;
-}
-
-static INLINE struct nvfx_src
-tgsi_src(struct nvfx_fpc *fpc, const struct tgsi_full_src_register *fsrc)
-{
- struct nvfx_src src;
-
- switch (fsrc->Register.File) {
- case TGSI_FILE_INPUT:
- if(fpc->pfp->info.input_semantic_name[fsrc->Register.Index] == TGSI_SEMANTIC_POSITION) {
- assert(fpc->pfp->info.input_semantic_index[fsrc->Register.Index] == 0);
- src.reg = nvfx_reg(NVFXSR_INPUT, NVFX_FP_OP_INPUT_SRC_POSITION);
- } else if(fpc->pfp->info.input_semantic_name[fsrc->Register.Index] == TGSI_SEMANTIC_COLOR) {
- if(fpc->pfp->info.input_semantic_index[fsrc->Register.Index] == 0)
- src.reg = nvfx_reg(NVFXSR_INPUT, NVFX_FP_OP_INPUT_SRC_COL0);
- else if(fpc->pfp->info.input_semantic_index[fsrc->Register.Index] == 1)
- src.reg = nvfx_reg(NVFXSR_INPUT, NVFX_FP_OP_INPUT_SRC_COL1);
- else
- assert(0);
- } else if(fpc->pfp->info.input_semantic_name[fsrc->Register.Index] == TGSI_SEMANTIC_FOG) {
- assert(fpc->pfp->info.input_semantic_index[fsrc->Register.Index] == 0);
- src.reg = nvfx_reg(NVFXSR_INPUT, NVFX_FP_OP_INPUT_SRC_FOGC);
- } else if(fpc->pfp->info.input_semantic_name[fsrc->Register.Index] == TGSI_SEMANTIC_FACE) {
- /* TODO: check this has the correct values */
- /* XXX: what do we do for nv30 here (assuming it lacks facing)?! */
- assert(fpc->pfp->info.input_semantic_index[fsrc->Register.Index] == 0);
- src.reg = nvfx_reg(NVFXSR_INPUT, NV40_FP_OP_INPUT_SRC_FACING);
- } else {
- assert(fpc->pfp->info.input_semantic_name[fsrc->Register.Index] == TGSI_SEMANTIC_GENERIC);
- src.reg = nvfx_reg(NVFXSR_RELOCATED, fpc->generic_to_slot[fpc->pfp->info.input_semantic_index[fsrc->Register.Index]]);
- }
- break;
- case TGSI_FILE_CONSTANT:
- src.reg = nvfx_reg(NVFXSR_CONST, fsrc->Register.Index);
- break;
- case TGSI_FILE_IMMEDIATE:
- assert(fsrc->Register.Index < fpc->nr_imm);
- src.reg = fpc->r_imm[fsrc->Register.Index];
- break;
- case TGSI_FILE_TEMPORARY:
- src.reg = fpc->r_temp[fsrc->Register.Index];
- break;
- /* NV40 fragprog result regs are just temps, so this is simple */
- case TGSI_FILE_OUTPUT:
- src.reg = fpc->r_result[fsrc->Register.Index];
- break;
- default:
- NOUVEAU_ERR("bad src file\n");
- src.reg.index = 0;
- src.reg.type = 0;
- break;
- }
-
- src.abs = fsrc->Register.Absolute;
- src.negate = fsrc->Register.Negate;
- src.swz[0] = fsrc->Register.SwizzleX;
- src.swz[1] = fsrc->Register.SwizzleY;
- src.swz[2] = fsrc->Register.SwizzleZ;
- src.swz[3] = fsrc->Register.SwizzleW;
- src.indirect = 0;
- src.indirect_reg = 0;
- src.indirect_swz = 0;
- return src;
-}
-
-static INLINE struct nvfx_reg
-tgsi_dst(struct nvfx_fpc *fpc, const struct tgsi_full_dst_register *fdst) {
- switch (fdst->Register.File) {
- case TGSI_FILE_OUTPUT:
- return fpc->r_result[fdst->Register.Index];
- case TGSI_FILE_TEMPORARY:
- return fpc->r_temp[fdst->Register.Index];
- case TGSI_FILE_NULL:
- return nvfx_reg(NVFXSR_NONE, 0);
- default:
- NOUVEAU_ERR("bad dst file %d\n", fdst->Register.File);
- return nvfx_reg(NVFXSR_NONE, 0);
- }
-}
-
-static INLINE int
-tgsi_mask(uint tgsi)
-{
- int mask = 0;
-
- if (tgsi & TGSI_WRITEMASK_X) mask |= NVFX_FP_MASK_X;
- if (tgsi & TGSI_WRITEMASK_Y) mask |= NVFX_FP_MASK_Y;
- if (tgsi & TGSI_WRITEMASK_Z) mask |= NVFX_FP_MASK_Z;
- if (tgsi & TGSI_WRITEMASK_W) mask |= NVFX_FP_MASK_W;
- return mask;
-}
-
-static boolean
-nvfx_fragprog_parse_instruction(struct nvfx_context* nvfx, struct nvfx_fpc *fpc,
- const struct tgsi_full_instruction *finst)
-{
- const struct nvfx_src none = nvfx_src(nvfx_reg(NVFXSR_NONE, 0));
- struct nvfx_insn insn;
- struct nvfx_src src[3], tmp;
- struct nvfx_reg dst;
- int mask, sat, unit = 0;
- int ai = -1, ci = -1, ii = -1;
- int i;
-
- if (finst->Instruction.Opcode == TGSI_OPCODE_END)
- return TRUE;
-
- for (i = 0; i < finst->Instruction.NumSrcRegs; i++) {
- const struct tgsi_full_src_register *fsrc;
-
- fsrc = &finst->Src[i];
- if (fsrc->Register.File == TGSI_FILE_TEMPORARY) {
- src[i] = tgsi_src(fpc, fsrc);
- }
- }
-
- for (i = 0; i < finst->Instruction.NumSrcRegs; i++) {
- const struct tgsi_full_src_register *fsrc;
-
- fsrc = &finst->Src[i];
-
- switch (fsrc->Register.File) {
- case TGSI_FILE_INPUT:
- if(fpc->pfp->info.input_semantic_name[fsrc->Register.Index] == TGSI_SEMANTIC_FOG && (0
- || fsrc->Register.SwizzleX == PIPE_SWIZZLE_ALPHA
- || fsrc->Register.SwizzleY == PIPE_SWIZZLE_ALPHA
- || fsrc->Register.SwizzleZ == PIPE_SWIZZLE_ALPHA
- || fsrc->Register.SwizzleW == PIPE_SWIZZLE_ALPHA
- )) {
- /* hardware puts 0 in fogcoord.w, but GL/Gallium want 1 there */
- struct nvfx_src addend = nvfx_src(nvfx_fp_imm(fpc, 0, 0, 0, 1));
- addend.swz[0] = fsrc->Register.SwizzleX;
- addend.swz[1] = fsrc->Register.SwizzleY;
- addend.swz[2] = fsrc->Register.SwizzleZ;
- addend.swz[3] = fsrc->Register.SwizzleW;
- src[i] = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, ADD, src[i].reg, NVFX_FP_MASK_ALL, tgsi_src(fpc, fsrc), addend, none));
- } else if (ai == -1 || ai == fsrc->Register.Index) {
- ai = fsrc->Register.Index;
- src[i] = tgsi_src(fpc, fsrc);
- } else {
- src[i] = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, MOV, src[i].reg, NVFX_FP_MASK_ALL, tgsi_src(fpc, fsrc), none, none));
- }
- break;
- case TGSI_FILE_CONSTANT:
- if ((ci == -1 && ii == -1) ||
- ci == fsrc->Register.Index) {
- ci = fsrc->Register.Index;
- src[i] = tgsi_src(fpc, fsrc);
- } else {
- src[i] = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, MOV, src[i].reg, NVFX_FP_MASK_ALL, tgsi_src(fpc, fsrc), none, none));
- }
- break;
- case TGSI_FILE_IMMEDIATE:
- if ((ci == -1 && ii == -1) ||
- ii == fsrc->Register.Index) {
- ii = fsrc->Register.Index;
- src[i] = tgsi_src(fpc, fsrc);
- } else {
- src[i] = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, MOV, src[i].reg, NVFX_FP_MASK_ALL, tgsi_src(fpc, fsrc), none, none));
- }
- break;
- case TGSI_FILE_TEMPORARY:
- /* handled above */
- break;
- case TGSI_FILE_SAMPLER:
- unit = fsrc->Register.Index;
- break;
- case TGSI_FILE_OUTPUT:
- break;
- default:
- NOUVEAU_ERR("bad src file\n");
- return FALSE;
- }
- }
-
- dst = tgsi_dst(fpc, &finst->Dst[0]);
- mask = tgsi_mask(finst->Dst[0].Register.WriteMask);
- sat = (finst->Instruction.Saturate == TGSI_SAT_ZERO_ONE);
-
- switch (finst->Instruction.Opcode) {
- case TGSI_OPCODE_ABS:
- nvfx_fp_emit(fpc, arith(sat, MOV, dst, mask, abs(src[0]), none, none));
- break;
- case TGSI_OPCODE_ADD:
- nvfx_fp_emit(fpc, arith(sat, ADD, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_CMP:
- insn = arith(0, MOV, none.reg, mask, src[0], none, none);
- insn.cc_update = 1;
- nvfx_fp_emit(fpc, insn);
-
- insn = arith(sat, MOV, dst, mask, src[2], none, none);
- insn.cc_test = NVFX_COND_GE;
- nvfx_fp_emit(fpc, insn);
-
- insn = arith(sat, MOV, dst, mask, src[1], none, none);
- insn.cc_test = NVFX_COND_LT;
- nvfx_fp_emit(fpc, insn);
- break;
- case TGSI_OPCODE_COS:
- nvfx_fp_emit(fpc, arith(sat, COS, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_DDX:
- if (mask & (NVFX_FP_MASK_Z | NVFX_FP_MASK_W)) {
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(sat, DDX, tmp.reg, NVFX_FP_MASK_X | NVFX_FP_MASK_Y, swz(src[0], Z, W, Z, W), none, none));
- nvfx_fp_emit(fpc, arith(0, MOV, tmp.reg, NVFX_FP_MASK_Z | NVFX_FP_MASK_W, swz(tmp, X, Y, X, Y), none, none));
- nvfx_fp_emit(fpc, arith(sat, DDX, tmp.reg, NVFX_FP_MASK_X | NVFX_FP_MASK_Y, src[0], none, none));
- nvfx_fp_emit(fpc, arith(0, MOV, dst, mask, tmp, none, none));
- } else {
- nvfx_fp_emit(fpc, arith(sat, DDX, dst, mask, src[0], none, none));
- }
- break;
- case TGSI_OPCODE_DDY:
- if (mask & (NVFX_FP_MASK_Z | NVFX_FP_MASK_W)) {
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(sat, DDY, tmp.reg, NVFX_FP_MASK_X | NVFX_FP_MASK_Y, swz(src[0], Z, W, Z, W), none, none));
- nvfx_fp_emit(fpc, arith(0, MOV, tmp.reg, NVFX_FP_MASK_Z | NVFX_FP_MASK_W, swz(tmp, X, Y, X, Y), none, none));
- nvfx_fp_emit(fpc, arith(sat, DDY, tmp.reg, NVFX_FP_MASK_X | NVFX_FP_MASK_Y, src[0], none, none));
- nvfx_fp_emit(fpc, arith(0, MOV, dst, mask, tmp, none, none));
- } else {
- nvfx_fp_emit(fpc, arith(sat, DDY, dst, mask, src[0], none, none));
- }
- break;
- case TGSI_OPCODE_DP2:
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, MUL, tmp.reg, NVFX_FP_MASK_X | NVFX_FP_MASK_Y, src[0], src[1], none));
- nvfx_fp_emit(fpc, arith(0, ADD, dst, mask, swz(tmp, X, X, X, X), swz(tmp, Y, Y, Y, Y), none));
- break;
- case TGSI_OPCODE_DP3:
- nvfx_fp_emit(fpc, arith(sat, DP3, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_DP4:
- nvfx_fp_emit(fpc, arith(sat, DP4, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_DPH:
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, DP3, tmp.reg, NVFX_FP_MASK_X, src[0], src[1], none));
- nvfx_fp_emit(fpc, arith(sat, ADD, dst, mask, swz(tmp, X, X, X, X), swz(src[1], W, W, W, W), none));
- break;
- case TGSI_OPCODE_DST:
- nvfx_fp_emit(fpc, arith(sat, DST, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_EX2:
- nvfx_fp_emit(fpc, arith(sat, EX2, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_FLR:
- nvfx_fp_emit(fpc, arith(sat, FLR, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_FRC:
- nvfx_fp_emit(fpc, arith(sat, FRC, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_KILP:
- nvfx_fp_emit(fpc, arith(0, KIL, none.reg, 0, none, none, none));
- break;
- case TGSI_OPCODE_KIL:
- insn = arith(0, MOV, none.reg, NVFX_FP_MASK_ALL, src[0], none, none);
- insn.cc_update = 1;
- nvfx_fp_emit(fpc, insn);
-
- insn = arith(0, KIL, none.reg, 0, none, none, none);
- insn.cc_test = NVFX_COND_LT;
- nvfx_fp_emit(fpc, insn);
- break;
- case TGSI_OPCODE_LG2:
- nvfx_fp_emit(fpc, arith(sat, LG2, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_LIT:
- if(!nvfx->is_nv4x)
- nvfx_fp_emit(fpc, arith(sat, LIT_NV30, dst, mask, src[0], src[1], src[2]));
- else {
- /* we use FLT_MIN, so that log2 never gives -infinity, and thus multiplication by
- * specular 0 always gives 0, so that ex2 gives 1, to satisfy the 0^0 = 1 requirement
- *
- * NOTE: if we start using half precision, we might need an fp16 FLT_MIN here instead
- */
- struct nvfx_src maxs = nvfx_src(nvfx_fp_imm(fpc, 0, FLT_MIN, 0, 0));
- tmp = nvfx_src(temp(fpc));
- if (ci>= 0 || ii >= 0) {
- nvfx_fp_emit(fpc, arith(0, MOV, tmp.reg, NVFX_FP_MASK_X | NVFX_FP_MASK_Y, maxs, none, none));
- maxs = tmp;
- }
- nvfx_fp_emit(fpc, arith(0, MAX, tmp.reg, NVFX_FP_MASK_Y | NVFX_FP_MASK_W, swz(src[0], X, X, X, Y), swz(maxs, X, X, Y, Y), none));
- nvfx_fp_emit(fpc, arith(0, LG2, tmp.reg, NVFX_FP_MASK_W, swz(tmp, W, W, W, W), none, none));
- nvfx_fp_emit(fpc, arith(0, MUL, tmp.reg, NVFX_FP_MASK_W, swz(tmp, W, W, W, W), swz(src[0], W, W, W, W), none));
- nvfx_fp_emit(fpc, arith(sat, LITEX2_NV40, dst, mask, swz(tmp, Y, Y, W, W), none, none));
- }
- break;
- case TGSI_OPCODE_LRP:
- if(!nvfx->is_nv4x)
- nvfx_fp_emit(fpc, arith(sat, LRP_NV30, dst, mask, src[0], src[1], src[2]));
- else {
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, MAD, tmp.reg, mask, neg(src[0]), src[2], src[2]));
- nvfx_fp_emit(fpc, arith(sat, MAD, dst, mask, src[0], src[1], tmp));
- }
- break;
- case TGSI_OPCODE_MAD:
- nvfx_fp_emit(fpc, arith(sat, MAD, dst, mask, src[0], src[1], src[2]));
- break;
- case TGSI_OPCODE_MAX:
- nvfx_fp_emit(fpc, arith(sat, MAX, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_MIN:
- nvfx_fp_emit(fpc, arith(sat, MIN, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_MOV:
- nvfx_fp_emit(fpc, arith(sat, MOV, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_MUL:
- nvfx_fp_emit(fpc, arith(sat, MUL, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_NOP:
- break;
- case TGSI_OPCODE_POW:
- if(!nvfx->is_nv4x)
- nvfx_fp_emit(fpc, arith(sat, POW_NV30, dst, mask, src[0], src[1], none));
- else {
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, LG2, tmp.reg, NVFX_FP_MASK_X, swz(src[0], X, X, X, X), none, none));
- nvfx_fp_emit(fpc, arith(0, MUL, tmp.reg, NVFX_FP_MASK_X, swz(tmp, X, X, X, X), swz(src[1], X, X, X, X), none));
- nvfx_fp_emit(fpc, arith(sat, EX2, dst, mask, swz(tmp, X, X, X, X), none, none));
- }
- break;
- case TGSI_OPCODE_RCP:
- nvfx_fp_emit(fpc, arith(sat, RCP, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_RFL:
- if(!nvfx->is_nv4x)
- nvfx_fp_emit(fpc, arith(0, RFL_NV30, dst, mask, src[0], src[1], none));
- else {
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, DP3, tmp.reg, NVFX_FP_MASK_X, src[0], src[0], none));
- nvfx_fp_emit(fpc, arith(0, DP3, tmp.reg, NVFX_FP_MASK_Y, src[0], src[1], none));
- insn = arith(0, DIV, tmp.reg, NVFX_FP_MASK_Z, swz(tmp, Y, Y, Y, Y), swz(tmp, X, X, X, X), none);
- insn.scale = NVFX_FP_OP_DST_SCALE_2X;
- nvfx_fp_emit(fpc, insn);
- nvfx_fp_emit(fpc, arith(sat, MAD, dst, mask, swz(tmp, Z, Z, Z, Z), src[0], neg(src[1])));
- }
- break;
- case TGSI_OPCODE_RSQ:
- if(!nvfx->is_nv4x)
- nvfx_fp_emit(fpc, arith(sat, RSQ_NV30, dst, mask, abs(swz(src[0], X, X, X, X)), none, none));
- else {
- tmp = nvfx_src(temp(fpc));
- insn = arith(0, LG2, tmp.reg, NVFX_FP_MASK_X, abs(swz(src[0], X, X, X, X)), none, none);
- insn.scale = NVFX_FP_OP_DST_SCALE_INV_2X;
- nvfx_fp_emit(fpc, insn);
- nvfx_fp_emit(fpc, arith(sat, EX2, dst, mask, neg(swz(tmp, X, X, X, X)), none, none));
- }
- break;
- case TGSI_OPCODE_SCS:
- /* avoid overwriting the source */
- if(src[0].swz[NVFX_SWZ_X] != NVFX_SWZ_X)
- {
- if (mask & NVFX_FP_MASK_X)
- nvfx_fp_emit(fpc, arith(sat, COS, dst, NVFX_FP_MASK_X, swz(src[0], X, X, X, X), none, none));
- if (mask & NVFX_FP_MASK_Y)
- nvfx_fp_emit(fpc, arith(sat, SIN, dst, NVFX_FP_MASK_Y, swz(src[0], X, X, X, X), none, none));
- }
- else
- {
- if (mask & NVFX_FP_MASK_Y)
- nvfx_fp_emit(fpc, arith(sat, SIN, dst, NVFX_FP_MASK_Y, swz(src[0], X, X, X, X), none, none));
- if (mask & NVFX_FP_MASK_X)
- nvfx_fp_emit(fpc, arith(sat, COS, dst, NVFX_FP_MASK_X, swz(src[0], X, X, X, X), none, none));
- }
- break;
- case TGSI_OPCODE_SEQ:
- nvfx_fp_emit(fpc, arith(sat, SEQ, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SFL:
- nvfx_fp_emit(fpc, arith(sat, SFL, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SGE:
- nvfx_fp_emit(fpc, arith(sat, SGE, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SGT:
- nvfx_fp_emit(fpc, arith(sat, SGT, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SIN:
- nvfx_fp_emit(fpc, arith(sat, SIN, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_SLE:
- nvfx_fp_emit(fpc, arith(sat, SLE, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SLT:
- nvfx_fp_emit(fpc, arith(sat, SLT, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SNE:
- nvfx_fp_emit(fpc, arith(sat, SNE, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SSG:
- {
- struct nvfx_src minones = swz(nvfx_src(nvfx_fp_imm(fpc, -1, -1, -1, -1)), X, X, X, X);
-
- insn = arith(sat, MOV, dst, mask, src[0], none, none);
- insn.cc_update = 1;
- nvfx_fp_emit(fpc, insn);
-
- insn = arith(0, STR, dst, mask, none, none, none);
- insn.cc_test = NVFX_COND_GT;
- nvfx_fp_emit(fpc, insn);
-
- if(!sat) {
- insn = arith(0, MOV, dst, mask, minones, none, none);
- insn.cc_test = NVFX_COND_LT;
- nvfx_fp_emit(fpc, insn);
- }
- break;
- }
- case TGSI_OPCODE_STR:
- nvfx_fp_emit(fpc, arith(sat, STR, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SUB:
- nvfx_fp_emit(fpc, arith(sat, ADD, dst, mask, src[0], neg(src[1]), none));
- break;
- case TGSI_OPCODE_TEX:
- nvfx_fp_emit(fpc, tex(sat, TEX, unit, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_TRUNC:
- tmp = nvfx_src(temp(fpc));
- insn = arith(0, MOV, none.reg, mask, src[0], none, none);
- insn.cc_update = 1;
- nvfx_fp_emit(fpc, insn);
-
- nvfx_fp_emit(fpc, arith(0, FLR, tmp.reg, mask, abs(src[0]), none, none));
- nvfx_fp_emit(fpc, arith(sat, MOV, dst, mask, tmp, none, none));
-
- insn = arith(sat, MOV, dst, mask, neg(tmp), none, none);
- insn.cc_test = NVFX_COND_LT;
- nvfx_fp_emit(fpc, insn);
- break;
- case TGSI_OPCODE_TXB:
- nvfx_fp_emit(fpc, tex(sat, TXB, unit, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_TXL:
- if(nvfx->is_nv4x)
- nvfx_fp_emit(fpc, tex(sat, TXL_NV40, unit, dst, mask, src[0], none, none));
- else /* unsupported on nv30, use TEX and hope they like it */
- nvfx_fp_emit(fpc, tex(sat, TEX, unit, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_TXP:
- nvfx_fp_emit(fpc, tex(sat, TXP, unit, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_XPD:
- tmp = nvfx_src(temp(fpc));
- nvfx_fp_emit(fpc, arith(0, MUL, tmp.reg, mask, swz(src[0], Z, X, Y, Y), swz(src[1], Y, Z, X, X), none));
- nvfx_fp_emit(fpc, arith(sat, MAD, dst, (mask & ~NVFX_FP_MASK_W), swz(src[0], Y, Z, X, X), swz(src[1], Z, X, Y, Y), neg(tmp)));
- break;
-
- case TGSI_OPCODE_IF:
- // MOVRC0 R31 (TR0.xyzw), R<src>:
- // IF (NE.xxxx) ELSE <else> END <end>
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- nv40_fp_if(fpc, src[0]);
- break;
-
- case TGSI_OPCODE_ELSE:
- {
- uint32_t *hw;
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- assert(util_dynarray_contains(&fpc->if_stack, unsigned));
- hw = &fpc->fp->insn[util_dynarray_top(&fpc->if_stack, unsigned)];
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH | fpc->fp->insn_len;
- break;
- }
-
- case TGSI_OPCODE_ENDIF:
- {
- uint32_t *hw;
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- assert(util_dynarray_contains(&fpc->if_stack, unsigned));
- hw = &fpc->fp->insn[util_dynarray_pop(&fpc->if_stack, unsigned)];
- if(!hw[2])
- hw[2] = NV40_FP_OP_OPCODE_IS_BRANCH | fpc->fp->insn_len;
- hw[3] = fpc->fp->insn_len;
- break;
- }
-
- case TGSI_OPCODE_BRA:
- /* This can in limited cases be implemented with an IF with the else and endif labels pointing to the target */
- /* no state tracker uses this, so don't implement this for now */
- assert(0);
- nv40_fp_bra(fpc, finst->Label.Label);
- break;
-
- case TGSI_OPCODE_BGNSUB:
- case TGSI_OPCODE_ENDSUB:
- /* nothing to do here */
- break;
-
- case TGSI_OPCODE_CAL:
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- nv40_fp_cal(fpc, finst->Label.Label);
- break;
-
- case TGSI_OPCODE_RET:
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- nv40_fp_ret(fpc);
- break;
-
- case TGSI_OPCODE_BGNLOOP:
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- /* TODO: we should support using two nested REPs to allow a > 255 iteration count */
- nv40_fp_rep(fpc, 255, finst->Label.Label);
- break;
-
- case TGSI_OPCODE_ENDLOOP:
- break;
-
- case TGSI_OPCODE_BRK:
- if(!nvfx->use_nv4x)
- goto nv3x_cflow;
- nv40_fp_brk(fpc);
- break;
-
- case TGSI_OPCODE_CONT:
- {
- static int warned = 0;
- if(!warned) {
- NOUVEAU_ERR("Sorry, the continue keyword is not implemented: ignoring it.\n");
- warned = 1;
- }
- break;
- }
-
- default:
- NOUVEAU_ERR("invalid opcode %d\n", finst->Instruction.Opcode);
- return FALSE;
- }
-
-out:
- release_temps(fpc);
- return TRUE;
-nv3x_cflow:
- {
- static int warned = 0;
- if(!warned) {
- NOUVEAU_ERR(
- "Sorry, control flow instructions are not supported in hardware on nv3x: ignoring them\n"
- "If rendering is incorrect, try to disable GLSL support in the application.\n");
- warned = 1;
- }
- }
- goto out;
-}
-
-static boolean
-nvfx_fragprog_parse_decl_output(struct nvfx_context* nvfx, struct nvfx_fpc *fpc,
- const struct tgsi_full_declaration *fdec)
-{
- unsigned idx = fdec->Range.First;
- unsigned hw;
-
- switch (fdec->Semantic.Name) {
- case TGSI_SEMANTIC_POSITION:
- hw = 1;
- break;
- case TGSI_SEMANTIC_COLOR:
- hw = ~0;
- switch (fdec->Semantic.Index) {
- case 0: hw = 0; break;
- case 1: hw = 2; break;
- case 2: hw = 3; break;
- case 3: hw = 4; break;
- }
- if(hw > ((nvfx->use_nv4x) ? 4 : 2)) {
- NOUVEAU_ERR("bad rcol index\n");
- return FALSE;
- }
- break;
- default:
- NOUVEAU_ERR("bad output semantic\n");
- return FALSE;
- }
-
- fpc->r_result[idx] = nvfx_reg(NVFXSR_OUTPUT, hw);
- fpc->r_temps |= (1ULL << hw);
- return TRUE;
-}
-
-static boolean
-nvfx_fragprog_prepare(struct nvfx_context* nvfx, struct nvfx_fpc *fpc)
-{
- struct tgsi_parse_context p;
- int high_temp = -1, i;
- struct util_semantic_set set;
- unsigned num_texcoords = nvfx->use_nv4x ? 10 : 8;
-
- fpc->fp->num_slots = util_semantic_set_from_program_file(&set, fpc->pfp->pipe.tokens, TGSI_FILE_INPUT);
- if(fpc->fp->num_slots > num_texcoords)
- return FALSE;
- util_semantic_layout_from_set(fpc->fp->slot_to_generic, &set, 0, num_texcoords);
- util_semantic_table_from_layout(fpc->generic_to_slot, sizeof fpc->generic_to_slot,
- fpc->fp->slot_to_generic, 0, num_texcoords);
-
- memset(fpc->fp->slot_to_fp_input, 0xff, sizeof(fpc->fp->slot_to_fp_input));
-
- fpc->r_imm = CALLOC(fpc->pfp->info.immediate_count, sizeof(struct nvfx_reg));
-
- tgsi_parse_init(&p, fpc->pfp->pipe.tokens);
- while (!tgsi_parse_end_of_tokens(&p)) {
- const union tgsi_full_token *tok = &p.FullToken;
-
- tgsi_parse_token(&p);
- switch(tok->Token.Type) {
- case TGSI_TOKEN_TYPE_DECLARATION:
- {
- const struct tgsi_full_declaration *fdec;
- fdec = &p.FullToken.FullDeclaration;
- switch (fdec->Declaration.File) {
- case TGSI_FILE_OUTPUT:
- if (!nvfx_fragprog_parse_decl_output(nvfx, fpc, fdec))
- goto out_err;
- break;
- case TGSI_FILE_TEMPORARY:
- if (fdec->Range.Last > high_temp) {
- high_temp =
- fdec->Range.Last;
- }
- break;
- default:
- break;
- }
- }
- break;
- case TGSI_TOKEN_TYPE_IMMEDIATE:
- {
- struct tgsi_full_immediate *imm;
-
- imm = &p.FullToken.FullImmediate;
- assert(imm->Immediate.DataType == TGSI_IMM_FLOAT32);
- assert(fpc->nr_imm < fpc->pfp->info.immediate_count);
-
- fpc->r_imm[fpc->nr_imm++] = nvfx_fp_imm(fpc, imm->u[0].Float, imm->u[1].Float, imm->u[2].Float, imm->u[3].Float);
- break;
- }
- default:
- break;
- }
- }
- tgsi_parse_free(&p);
-
- if (++high_temp) {
- fpc->r_temp = CALLOC(high_temp, sizeof(struct nvfx_reg));
- for (i = 0; i < high_temp; i++)
- fpc->r_temp[i] = temp(fpc);
- fpc->r_temps_discard = 0ULL;
- }
-
- return TRUE;
-
-out_err:
- if (fpc->r_temp) {
- FREE(fpc->r_temp);
- fpc->r_temp = NULL;
- }
- tgsi_parse_free(&p);
- return FALSE;
-}
-
-DEBUG_GET_ONCE_BOOL_OPTION(nvfx_dump_fp, "NVFX_DUMP_FP", FALSE)
-
-static struct nvfx_fragment_program*
-nvfx_fragprog_translate(struct nvfx_context *nvfx,
- struct nvfx_pipe_fragment_program *pfp,
- boolean emulate_sprite_flipping)
-{
- struct tgsi_parse_context parse;
- struct nvfx_fpc *fpc = NULL;
- struct util_dynarray insns;
- struct nvfx_fragment_program* fp = NULL;
- const int min_size = 4096;
-
- fp = CALLOC_STRUCT(nvfx_fragment_program);
- if(!fp)
- goto out_err;
-
- fpc = CALLOC_STRUCT(nvfx_fpc);
- if (!fpc)
- goto out_err;
-
- fpc->max_temps = nvfx->use_nv4x ? 48 : 32;
- fpc->pfp = pfp;
- fpc->fp = fp;
- fpc->num_regs = 2;
-
- for (unsigned i = 0; i < pfp->info.num_properties; ++i) {
- if (pfp->info.properties[i].name == TGSI_PROPERTY_FS_COORD_ORIGIN) {
- if(pfp->info.properties[i].data[0])
- fp->coord_conventions |= NV30_3D_COORD_CONVENTIONS_ORIGIN_INVERTED;
- } else if (pfp->info.properties[i].name == TGSI_PROPERTY_FS_COORD_PIXEL_CENTER) {
- if(pfp->info.properties[i].data[0])
- fp->coord_conventions |= NV30_3D_COORD_CONVENTIONS_CENTER_INTEGER;
- }
- }
-
- if (!nvfx_fragprog_prepare(nvfx, fpc))
- goto out_err;
-
- tgsi_parse_init(&parse, pfp->pipe.tokens);
- util_dynarray_init(&insns);
-
- if(emulate_sprite_flipping)
- {
- struct nvfx_reg reg = temp(fpc);
- struct nvfx_src sprite_input = nvfx_src(nvfx_reg(NVFXSR_RELOCATED, fp->num_slots));
- struct nvfx_src imm = nvfx_src(nvfx_fp_imm(fpc, 1, -1, 0, 0));
-
- fpc->sprite_coord_temp = reg.index;
- fpc->r_temps_discard = 0ULL;
- nvfx_fp_emit(fpc, arith(0, MAD, reg, NVFX_FP_MASK_ALL, sprite_input, swz(imm, X, Y, X, X), swz(imm, Z, X, Z, Z)));
- }
-
- while (!tgsi_parse_end_of_tokens(&parse)) {
- tgsi_parse_token(&parse);
-
- switch (parse.FullToken.Token.Type) {
- case TGSI_TOKEN_TYPE_INSTRUCTION:
- {
- const struct tgsi_full_instruction *finst;
-
- util_dynarray_append(&insns, unsigned, fp->insn_len);
- finst = &parse.FullToken.FullInstruction;
- if (!nvfx_fragprog_parse_instruction(nvfx, fpc, finst))
- goto out_err;
- }
- break;
- default:
- break;
- }
- }
- util_dynarray_append(&insns, unsigned, fp->insn_len);
-
- for(unsigned i = 0; i < fpc->label_relocs.size; i += sizeof(struct nvfx_relocation))
- {
- struct nvfx_relocation* label_reloc = (struct nvfx_relocation*)((char*)fpc->label_relocs.data + i);
- fp->insn[label_reloc->location] |= ((unsigned*)insns.data)[label_reloc->target];
- }
- util_dynarray_fini(&insns);
-
- if(!nvfx->is_nv4x)
- fp->fp_control |= (fpc->num_regs-1)/2;
- else
- fp->fp_control |= fpc->num_regs << NV40_3D_FP_CONTROL_TEMP_COUNT__SHIFT;
-
- /* Terminate final instruction */
- if(fp->insn)
- fp->insn[fpc->inst_offset] |= 0x00000001;
-
- /* Append NOP + END instruction for branches to the end of the program */
- fpc->inst_offset = fp->insn_len;
- grow_insns(fpc, 4);
- fp->insn[fpc->inst_offset + 0] = 0x00000001;
- fp->insn[fpc->inst_offset + 1] = 0x00000000;
- fp->insn[fpc->inst_offset + 2] = 0x00000000;
- fp->insn[fpc->inst_offset + 3] = 0x00000000;
-
- if(debug_get_option_nvfx_dump_fp())
- {
- debug_printf("\n");
- tgsi_dump(pfp->pipe.tokens, 0);
-
- debug_printf("\n%s fragment program:\n", nvfx->is_nv4x ? "nv4x" : "nv3x");
- for (unsigned i = 0; i < fp->insn_len; i += 4)
- debug_printf("%3u: %08x %08x %08x %08x\n", i >> 2, fp->insn[i], fp->insn[i + 1], fp->insn[i + 2], fp->insn[i + 3]);
- debug_printf("\n");
- }
-
- fp->prog_size = (fp->insn_len * 4 + 63) & ~63;
-
- if(fp->prog_size >= min_size)
- fp->progs_per_bo = 1;
- else
- fp->progs_per_bo = min_size / fp->prog_size;
- fp->bo_prog_idx = fp->progs_per_bo - 1;
-
-out:
- tgsi_parse_free(&parse);
- if(fpc)
- {
- if (fpc->r_temp)
- FREE(fpc->r_temp);
- util_dynarray_fini(&fpc->if_stack);
- util_dynarray_fini(&fpc->label_relocs);
- util_dynarray_fini(&fpc->imm_data);
- //util_dynarray_fini(&fpc->loop_stack);
- FREE(fpc);
- }
- return fp;
-
-out_err:
- _debug_printf("Error: failed to compile this fragment program:\n");
- tgsi_dump(pfp->pipe.tokens, 0);
-
- if(fp)
- {
- FREE(fp);
- fp = NULL;
- }
- goto out;
-}
-
-static inline void
-nvfx_fp_memcpy(void* dst, const void* src, size_t len)
-{
-#ifndef PIPE_ARCH_BIG_ENDIAN
- memcpy(dst, src, len);
-#else
- size_t i;
- for(i = 0; i < len; i += 4) {
- uint32_t v = *(uint32_t*)((char*)src + i);
- *(uint32_t*)((char*)dst + i) = (v >> 16) | (v << 16);
- }
-#endif
-}
-
-/* The hardware only supports immediate constants inside the fragment program,
- * and at least on nv30 doesn't support an indirect linkage table.
- *
- * Hence, we need to patch the fragment program itself both to update constants
- * and update linkage.
- *
- * Using a single fragment program would entail unacceptable stalls if the GPU is
- * already rendering with that fragment program.
- * Thus, we instead use a "rotating queue" of buffer objects, each of which is
- * packed with multiple versions of the same program.
- *
- * Whenever we need to patch something, we move to the next program and
- * patch it. If all buffer objects are in use by the GPU, we allocate another one,
- * expanding the queue.
- *
- * As an additional optimization, we record when all the programs have the
- * current input slot configuration, and at that point we stop patching inputs.
- * This happens, for instance, if a given fragment program is always used with
- * the same vertex program (i.e. always with GLSL), or if the layouts match
- * enough (non-GLSL).
- *
- * Note that instead of using multiple programs, we could push commands
- * on the FIFO to patch a single program: it's not fully clear which option is
- * faster, but my guess is that the current way is faster.
- *
- * We also track the previous slot assignments for each version and don't
- * patch if they are the same (this could perhaps be removed).
- */
-
-void
-nvfx_fragprog_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct nvfx_pipe_fragment_program *pfp = nvfx->fragprog;
- struct nvfx_vertex_program* vp;
-
- // TODO: the multiplication by point_quad_rasterization is probably superfluous
- unsigned sprite_coord_enable = nvfx->rasterizer->pipe.point_quad_rasterization * nvfx->rasterizer->pipe.sprite_coord_enable;
-
- boolean emulate_sprite_flipping = sprite_coord_enable && nvfx->rasterizer->pipe.sprite_coord_mode;
- unsigned key = emulate_sprite_flipping;
- struct nvfx_fragment_program* fp;
-
- fp = pfp->fps[key];
- if (!fp)
- {
- fp = nvfx_fragprog_translate(nvfx, pfp, emulate_sprite_flipping);
-
- if(!fp)
- {
- if(!nvfx->dummy_fs)
- {
- struct ureg_program *ureg = ureg_create( TGSI_PROCESSOR_FRAGMENT );
- if (ureg)
- {
- ureg_END( ureg );
- nvfx->dummy_fs = ureg_create_shader_and_destroy( ureg, &nvfx->pipe );
- }
-
- if(!nvfx->dummy_fs)
- {
- _debug_printf("Error: unable to create a dummy fragment shader: aborting.");
- abort();
- }
- }
-
- fp = nvfx_fragprog_translate(nvfx, nvfx->dummy_fs, FALSE);
- emulate_sprite_flipping = FALSE;
-
- if(!fp)
- {
- _debug_printf("Error: unable to compile even a dummy fragment shader: aborting.");
- abort();
- }
- }
-
- pfp->fps[key] = fp;
- }
-
- vp = nvfx->hw_vertprog;
-
- if (fp->last_vp_id != vp->id || fp->last_sprite_coord_enable != sprite_coord_enable) {
- int sprite_real_input = -1;
- int sprite_reloc_input;
- unsigned i;
- fp->last_vp_id = vp->id;
- fp->last_sprite_coord_enable = sprite_coord_enable;
-
- if(sprite_coord_enable)
- {
- sprite_real_input = vp->sprite_fp_input;
- if(sprite_real_input < 0)
- {
- unsigned used_texcoords = 0;
- for(unsigned i = 0; i < fp->num_slots; ++i) {
- unsigned generic = fp->slot_to_generic[i];
- if((generic < 32) && !((1 << generic) & sprite_coord_enable))
- {
- unsigned char slot_mask = vp->generic_to_fp_input[generic];
- if(slot_mask >= 0xf0)
- used_texcoords |= 1 << ((slot_mask & 0xf) - NVFX_FP_OP_INPUT_SRC_TC0);
- }
- }
-
- sprite_real_input = NVFX_FP_OP_INPUT_SRC_TC(__builtin_ctz(~used_texcoords));
- }
-
- fp->point_sprite_control |= (1 << (sprite_real_input - NVFX_FP_OP_INPUT_SRC_TC0 + 8));
- }
- else
- fp->point_sprite_control = 0;
-
- if(emulate_sprite_flipping)
- sprite_reloc_input = 0;
- else
- sprite_reloc_input = sprite_real_input;
-
- for(i = 0; i < fp->num_slots; ++i) {
- unsigned generic = fp->slot_to_generic[i];
- if((generic < 32) && ((1 << generic) & sprite_coord_enable))
- {
- if(fp->slot_to_fp_input[i] != sprite_reloc_input)
- goto update_slots;
- }
- else
- {
- unsigned char slot_mask = vp->generic_to_fp_input[generic];
- if((slot_mask >> 4) & (slot_mask ^ fp->slot_to_fp_input[i]))
- goto update_slots;
- }
- }
-
- if(emulate_sprite_flipping)
- {
- if(fp->slot_to_fp_input[fp->num_slots] != sprite_real_input)
- goto update_slots;
- }
-
- if(0)
- {
-update_slots:
- /* optimization: we start updating from the slot we found the first difference in */
- for(; i < fp->num_slots; ++i)
- {
- unsigned generic = fp->slot_to_generic[i];
- if((generic < 32) && ((1 << generic) & sprite_coord_enable))
- fp->slot_to_fp_input[i] = sprite_reloc_input;
- else
- fp->slot_to_fp_input[i] = vp->generic_to_fp_input[generic] & 0xf;
- }
-
- fp->slot_to_fp_input[fp->num_slots] = sprite_real_input;
-
- if(nvfx->is_nv4x)
- {
- fp->or = 0;
- for(i = 0; i <= fp->num_slots; ++i) {
- unsigned fp_input = fp->slot_to_fp_input[i];
- if(fp_input == NVFX_FP_OP_INPUT_SRC_TC(8))
- fp->or |= (1 << 12);
- else if(fp_input == NVFX_FP_OP_INPUT_SRC_TC(9))
- fp->or |= (1 << 13);
- else if(fp_input >= NVFX_FP_OP_INPUT_SRC_TC(0) && fp_input <= NVFX_FP_OP_INPUT_SRC_TC(7))
- fp->or |= (1 << (fp_input - NVFX_FP_OP_INPUT_SRC_TC0 + 14));
- }
- }
-
- fp->progs_left_with_obsolete_slot_assignments = fp->progs;
- goto update;
- }
- }
-
- /* We must update constants even on "just" fragprog changes, because
- * we don't check whether the current constant buffer matches the latest
- * one bound to this fragment program.
- * Doing such a check would likely be a pessimization.
- */
- if ((nvfx->hw_fragprog != fp) || (nvfx->dirty & (NVFX_NEW_FRAGPROG | NVFX_NEW_FRAGCONST))) {
- int offset;
- uint32_t* fpmap;
-
-update:
- ++fp->bo_prog_idx;
- if(fp->bo_prog_idx >= fp->progs_per_bo)
- {
- if(fp->fpbo && !nouveau_bo_busy(fp->fpbo->next->bo, NOUVEAU_BO_WR))
- {
- fp->fpbo = fp->fpbo->next;
- }
- else
- {
- struct nvfx_fragment_program_bo* fpbo = os_malloc_aligned(sizeof(struct nvfx_fragment_program) + (fp->prog_size + 8) * fp->progs_per_bo, 16);
- uint8_t* map;
- uint8_t* buf;
-
- fpbo->slots = (unsigned char*)&fpbo->insn[(fp->prog_size) * fp->progs_per_bo];
- memset(fpbo->slots, 0, 8 * fp->progs_per_bo);
- if(fp->fpbo)
- {
- fpbo->next = fp->fpbo->next;
- fp->fpbo->next = fpbo;
- }
- else
- fpbo->next = fpbo;
- fp->fpbo = fpbo;
- fpbo->bo = 0;
- fp->progs += fp->progs_per_bo;
- fp->progs_left_with_obsolete_slot_assignments += fp->progs_per_bo;
- nouveau_bo_new(nvfx->screen->base.device, NOUVEAU_BO_VRAM | NOUVEAU_BO_MAP, 64, fp->prog_size * fp->progs_per_bo, &fpbo->bo);
- nouveau_bo_map(fpbo->bo, NOUVEAU_BO_NOSYNC);
-
- map = fpbo->bo->map;
- buf = (uint8_t*)fpbo->insn;
- for(unsigned i = 0; i < fp->progs_per_bo; ++i)
- {
- memcpy(buf, fp->insn, fp->insn_len * 4);
- nvfx_fp_memcpy(map, fp->insn, fp->insn_len * 4);
- map += fp->prog_size;
- buf += fp->prog_size;
- }
- }
- fp->bo_prog_idx = 0;
- }
-
- offset = fp->bo_prog_idx * fp->prog_size;
- fpmap = (uint32_t*)((char*)fp->fpbo->bo->map + offset);
-
- if(nvfx->constbuf[PIPE_SHADER_FRAGMENT]) {
- struct pipe_resource* constbuf = nvfx->constbuf[PIPE_SHADER_FRAGMENT];
- uint32_t* map = (uint32_t*)nvfx_buffer(constbuf)->data;
- uint32_t* fpmap = (uint32_t*)((char*)fp->fpbo->bo->map + offset);
- uint32_t* buf = (uint32_t*)((char*)fp->fpbo->insn + offset);
- int i;
- for (i = 0; i < fp->nr_consts; ++i) {
- unsigned off = fp->consts[i].offset;
- unsigned idx = fp->consts[i].index * 4;
-
- /* TODO: is checking a good idea? */
- if(memcmp(&buf[off], &map[idx], 4 * sizeof(uint32_t))) {
- memcpy(&buf[off], &map[idx], 4 * sizeof(uint32_t));
- nvfx_fp_memcpy(&fpmap[off], &map[idx], 4 * sizeof(uint32_t));
- }
- }
- }
-
- /* we only do this if we aren't sure that all program versions have the
- * current slot assignments, otherwise we just update constants for speed
- */
- if(fp->progs_left_with_obsolete_slot_assignments) {
- unsigned char* fpbo_slots = &fp->fpbo->slots[fp->bo_prog_idx * 8];
- /* also relocate sprite coord slot, if any */
- for(unsigned i = 0; i <= fp->num_slots; ++i) {
- unsigned value = fp->slot_to_fp_input[i];;
- if(value != fpbo_slots[i]) {
- unsigned* p;
- unsigned* begin = (unsigned*)fp->slot_relocations[i].data;
- unsigned* end = (unsigned*)((char*)fp->slot_relocations[i].data + fp->slot_relocations[i].size);
- //printf("fp %p reloc slot %u/%u: %u -> %u\n", fp, i, fp->num_slots, fpbo_slots[i], value);
- if(value == 0)
- {
- /* was relocated to an input, switch type to temporary */
- for(p = begin; p != end; ++p) {
- unsigned off = *p;
- unsigned dw = fp->insn[off];
- dw &=~ NVFX_FP_REG_TYPE_MASK;
- //printf("reloc_tmp at %x\n", off);
- nvfx_fp_memcpy(&fpmap[off], &dw, sizeof(dw));
- }
- } else {
- if(!fpbo_slots[i])
- {
- /* was relocated to a temporary, switch type to input */
- for(p= begin; p != end; ++p) {
- unsigned off = *p;
- unsigned dw = fp->insn[off];
- //printf("reloc_in at %x\n", off);
- dw |= NVFX_FP_REG_TYPE_INPUT << NVFX_FP_REG_TYPE_SHIFT;
- nvfx_fp_memcpy(&fpmap[off], &dw, sizeof(dw));
- }
- }
-
- /* set the correct input index */
- for(p = begin; p != end; ++p) {
- unsigned off = *p & ~3;
- unsigned dw = fp->insn[off];
- //printf("reloc&~3 at %x\n", off);
- dw = (dw & ~NVFX_FP_OP_INPUT_SRC_MASK) | (value << NVFX_FP_OP_INPUT_SRC_SHIFT);
- nvfx_fp_memcpy(&fpmap[off], &dw, sizeof(dw));
- }
- }
- fpbo_slots[i] = value;
- }
- }
- --fp->progs_left_with_obsolete_slot_assignments;
- }
-
- nvfx->hw_fragprog = fp;
-
- MARK_RING(chan, 8, 1);
- BEGIN_RING(chan, eng3d, NV30_3D_FP_ACTIVE_PROGRAM, 1);
- OUT_RELOC(chan, fp->fpbo->bo, offset, NOUVEAU_BO_VRAM |
- NOUVEAU_BO_GART | NOUVEAU_BO_RD | NOUVEAU_BO_LOW |
- NOUVEAU_BO_OR, NV30_3D_FP_ACTIVE_PROGRAM_DMA0,
- NV30_3D_FP_ACTIVE_PROGRAM_DMA1);
- BEGIN_RING(chan, eng3d, NV30_3D_FP_CONTROL, 1);
- OUT_RING(chan, fp->fp_control);
- if(!nvfx->is_nv4x) {
- BEGIN_RING(chan, eng3d, NV30_3D_FP_REG_CONTROL, 1);
- OUT_RING(chan, (1<<16)|0x4);
- BEGIN_RING(chan, eng3d, NV30_3D_TEX_UNITS_ENABLE, 1);
- OUT_RING(chan, fp->samplers);
- }
- }
-
- {
- unsigned pointsprite_control = fp->point_sprite_control | nvfx->rasterizer->pipe.point_quad_rasterization;
- if(pointsprite_control != nvfx->hw_pointsprite_control)
- {
- BEGIN_RING(chan, eng3d, NV30_3D_POINT_SPRITE, 1);
- OUT_RING(chan, pointsprite_control);
- nvfx->hw_pointsprite_control = pointsprite_control;
- }
- }
-
- nvfx->relocs_needed &=~ NVFX_RELOCATE_FRAGPROG;
-}
-
-void
-nvfx_fragprog_relocate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nvfx_fragment_program *fp = nvfx->hw_fragprog;
- struct nouveau_bo* bo = fp->fpbo->bo;
- int offset = fp->bo_prog_idx * fp->prog_size;
- unsigned fp_flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_RD; // TODO: GART?
- fp_flags |= NOUVEAU_BO_DUMMY;
- MARK_RING(chan, 2, 2);
- OUT_RELOC(chan, bo, RING_3D(NV30_3D_FP_ACTIVE_PROGRAM, 1), fp_flags, 0, 0);
- OUT_RELOC(chan, bo, offset, fp_flags | NOUVEAU_BO_LOW |
- NOUVEAU_BO_OR, NV30_3D_FP_ACTIVE_PROGRAM_DMA0,
- NV30_3D_FP_ACTIVE_PROGRAM_DMA1);
- nvfx->relocs_needed &=~ NVFX_RELOCATE_FRAGPROG;
-}
-
-void
-nvfx_fragprog_destroy(struct nvfx_context *nvfx,
- struct nvfx_fragment_program *fp)
-{
- unsigned i;
- struct nvfx_fragment_program_bo* fpbo = fp->fpbo;
- if(fpbo)
- {
- do
- {
- struct nvfx_fragment_program_bo* next = fpbo->next;
- nouveau_bo_unmap(fpbo->bo);
- nouveau_bo_ref(0, &fpbo->bo);
- os_free_aligned(fpbo);
- fpbo = next;
- }
- while(fpbo != fp->fpbo);
- }
-
- for(i = 0; i < Elements(fp->slot_relocations); ++i)
- util_dynarray_fini(&fp->slot_relocations[i]);
-
- if (fp->insn_len)
- FREE(fp->insn);
-}
-
-static void *
-nvfx_fp_state_create(struct pipe_context *pipe,
- const struct pipe_shader_state *cso)
-{
- struct nvfx_pipe_fragment_program *pfp;
-
- pfp = CALLOC(1, sizeof(struct nvfx_pipe_fragment_program));
- pfp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
-
- tgsi_scan_shader(pfp->pipe.tokens, &pfp->info);
-
- return (void *)pfp;
-}
-
-static void
-nvfx_fp_state_bind(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->fragprog = hwcso;
- nvfx->dirty |= NVFX_NEW_FRAGPROG;
-}
-
-static void
-nvfx_fp_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_pipe_fragment_program *pfp = hwcso;
- unsigned i;
-
- for(i = 0; i < Elements(pfp->fps); ++i)
- {
- if(pfp->fps[i])
- {
- nvfx_fragprog_destroy(nvfx, pfp->fps[i]);
- FREE(pfp->fps[i]);
- }
- }
-
- FREE((void*)pfp->pipe.tokens);
- FREE(pfp);
-}
-
-void
-nvfx_init_fragprog_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.create_fs_state = nvfx_fp_state_create;
- nvfx->pipe.bind_fs_state = nvfx_fp_state_bind;
- nvfx->pipe.delete_fs_state = nvfx_fp_state_delete;
-}
+++ /dev/null
-#include "nvfx_context.h"
-#include "nvfx_resource.h"
-#include "nvfx_tex.h"
-
-static void *
-nvfx_sampler_state_create(struct pipe_context *pipe,
- const struct pipe_sampler_state *cso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_sampler_state *ps;
-
- ps = MALLOC(sizeof(struct nvfx_sampler_state));
-
- /* on nv30, we use this as an internal flag */
- ps->fmt = cso->normalized_coords ? 0 : NV40_3D_TEX_FORMAT_RECT;
- ps->en = 0;
- ps->filt = nvfx_tex_filter(cso) | 0x2000; /*voodoo*/
- ps->wrap = (nvfx_tex_wrap_mode(cso->wrap_s) << NV30_3D_TEX_WRAP_S__SHIFT) |
- (nvfx_tex_wrap_mode(cso->wrap_t) << NV30_3D_TEX_WRAP_T__SHIFT) |
- (nvfx_tex_wrap_mode(cso->wrap_r) << NV30_3D_TEX_WRAP_R__SHIFT);
- ps->compare = FALSE;
-
- if(cso->compare_mode == PIPE_TEX_COMPARE_R_TO_TEXTURE)
- {
- ps->wrap |= nvfx_tex_wrap_compare_mode(cso->compare_func);
- ps->compare = TRUE;
- }
- ps->bcol = nvfx_tex_border_color(cso->border_color.f);
-
- if(nvfx->is_nv4x)
- nv40_sampler_state_init(pipe, ps, cso);
- else
- nv30_sampler_state_init(pipe, ps, cso);
-
- return (void *)ps;
-}
-
-static void
-nvfx_sampler_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- FREE(hwcso);
-}
-
-static void
-nvfx_sampler_state_bind(struct pipe_context *pipe, unsigned nr, void **sampler)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- unsigned unit;
-
- for (unit = 0; unit < nr; unit++) {
- nvfx->tex_sampler[unit] = sampler[unit];
- nvfx->dirty_samplers |= (1 << unit);
- }
-
- for (unit = nr; unit < nvfx->nr_samplers; unit++) {
- nvfx->tex_sampler[unit] = NULL;
- nvfx->dirty_samplers |= (1 << unit);
- }
-
- nvfx->nr_samplers = nr;
- nvfx->dirty |= NVFX_NEW_SAMPLER;
-}
-
-static struct pipe_sampler_view *
-nvfx_create_sampler_view(struct pipe_context *pipe,
- struct pipe_resource *pt,
- const struct pipe_sampler_view *templ)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_sampler_view *sv = CALLOC_STRUCT(nvfx_sampler_view);
- struct nvfx_texture_format *tf = &nvfx_texture_formats[templ->format];
- unsigned txf;
-
- if (!sv)
- return NULL;
-
- sv->base = *templ;
- sv->base.reference.count = 1;
- sv->base.texture = NULL;
- pipe_resource_reference(&sv->base.texture, pt);
- sv->base.context = pipe;
-
- txf = NV30_3D_TEX_FORMAT_NO_BORDER;
-
- switch (pt->target) {
- case PIPE_TEXTURE_CUBE:
- txf |= NV30_3D_TEX_FORMAT_CUBIC;
- /* fall-through */
- case PIPE_TEXTURE_2D:
- case PIPE_TEXTURE_RECT:
- txf |= NV30_3D_TEX_FORMAT_DIMS_2D;
- break;
- case PIPE_TEXTURE_3D:
- txf |= NV30_3D_TEX_FORMAT_DIMS_3D;
- break;
- case PIPE_TEXTURE_1D:
- txf |= NV30_3D_TEX_FORMAT_DIMS_1D;
- break;
- default:
- assert(0);
- }
- sv->u.init_fmt = txf;
-
- sv->swizzle = 0
- | (tf->src[sv->base.swizzle_r] << NV30_3D_TEX_SWIZZLE_S0_Z__SHIFT)
- | (tf->src[sv->base.swizzle_g] << NV30_3D_TEX_SWIZZLE_S0_Y__SHIFT)
- | (tf->src[sv->base.swizzle_b] << NV30_3D_TEX_SWIZZLE_S0_X__SHIFT)
- | (tf->src[sv->base.swizzle_a] << NV30_3D_TEX_SWIZZLE_S0_W__SHIFT)
- | (tf->comp[sv->base.swizzle_r] << NV30_3D_TEX_SWIZZLE_S1_Z__SHIFT)
- | (tf->comp[sv->base.swizzle_g] << NV30_3D_TEX_SWIZZLE_S1_Y__SHIFT)
- | (tf->comp[sv->base.swizzle_b] << NV30_3D_TEX_SWIZZLE_S1_X__SHIFT)
- | (tf->comp[sv->base.swizzle_a] << NV30_3D_TEX_SWIZZLE_S1_W__SHIFT);
-
- sv->filt = tf->sign;
- sv->wrap = tf->wrap;
- sv->wrap_mask = ~0;
-
- if (pt->target == PIPE_TEXTURE_CUBE)
- {
- sv->offset = 0;
- sv->npot_size = (pt->width0 << NV30_3D_TEX_NPOT_SIZE_W__SHIFT) | pt->height0;
- }
- else
- {
- sv->offset = nvfx_subresource_offset(pt, 0, sv->base.u.tex.first_level, 0);
- sv->npot_size = (u_minify(pt->width0, sv->base.u.tex.first_level) << NV30_3D_TEX_NPOT_SIZE_W__SHIFT) | u_minify(pt->height0, sv->base.u.tex.first_level);
-
- /* apparently, we need to ignore the t coordinate for 1D textures to fix piglit tex1d-2dborder */
- if(pt->target == PIPE_TEXTURE_1D)
- {
- sv->wrap_mask &=~ NV30_3D_TEX_WRAP_T__MASK;
- sv->wrap |= NV30_3D_TEX_WRAP_T_REPEAT;
- }
- }
-
- if(nvfx->is_nv4x)
- nv40_sampler_view_init(pipe, sv);
- else
- nv30_sampler_view_init(pipe, sv);
-
- return &sv->base;
-}
-
-static void
-nvfx_sampler_view_destroy(struct pipe_context *pipe,
- struct pipe_sampler_view *view)
-{
- pipe_resource_reference(&view->texture, NULL);
- FREE(view);
-}
-
-static void
-nvfx_set_fragment_sampler_views(struct pipe_context *pipe,
- unsigned nr,
- struct pipe_sampler_view **views)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- unsigned unit;
-
- for (unit = 0; unit < nr; unit++) {
- pipe_sampler_view_reference(&nvfx->fragment_sampler_views[unit],
- views[unit]);
- nvfx->dirty_samplers |= (1 << unit);
- }
-
- for (unit = nr; unit < nvfx->nr_textures; unit++) {
- pipe_sampler_view_reference(&nvfx->fragment_sampler_views[unit],
- NULL);
- nvfx->dirty_samplers |= (1 << unit);
- }
-
- nvfx->nr_textures = nr;
- nvfx->dirty |= NVFX_NEW_SAMPLER;
-}
-
-void
-nvfx_fragtex_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned samplers, unit;
-
- samplers = nvfx->dirty_samplers;
- if(!samplers)
- return;
-
- while (samplers) {
- unit = ffs(samplers) - 1;
- samplers &= ~(1 << unit);
-
- if(nvfx->fragment_sampler_views[unit] && nvfx->tex_sampler[unit]) {
- if(!nvfx->is_nv4x)
- nv30_fragtex_set(nvfx, unit);
- else
- nv40_fragtex_set(nvfx, unit);
- } else {
- /* this is OK for nv40 too */
- BEGIN_RING(chan, eng3d, NV30_3D_TEX_ENABLE(unit), 1);
- OUT_RING(chan, 0);
- nvfx->hw_samplers &= ~(1 << unit);
- }
- }
- nvfx->dirty_samplers = 0;
- nvfx->relocs_needed &=~ NVFX_RELOCATE_FRAGTEX;
-}
-
-void
-nvfx_fragtex_relocate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- unsigned samplers, unit;
- unsigned tex_flags = NOUVEAU_BO_VRAM | NOUVEAU_BO_GART | NOUVEAU_BO_RD;
-
- samplers = nvfx->hw_samplers;
- while (samplers) {
- struct nvfx_miptree* mt;
- struct nouveau_bo *bo;
-
- unit = ffs(samplers) - 1;
- samplers &= ~(1 << unit);
-
- mt = (struct nvfx_miptree*)nvfx->fragment_sampler_views[unit]->texture;
- bo = mt->base.bo;
-
- MARK_RING(chan, 3, 3);
- OUT_RELOC(chan, bo, RING_3D(NV30_3D_TEX_OFFSET(unit), 2), tex_flags | NOUVEAU_BO_DUMMY, 0, 0);
- OUT_RELOC(chan, bo, 0, tex_flags | NOUVEAU_BO_LOW | NOUVEAU_BO_DUMMY, 0, 0);
- OUT_RELOC(chan, bo, nvfx->hw_txf[unit], tex_flags | NOUVEAU_BO_OR | NOUVEAU_BO_DUMMY,
- NV30_3D_TEX_FORMAT_DMA0, NV30_3D_TEX_FORMAT_DMA1);
- }
- nvfx->relocs_needed &=~ NVFX_RELOCATE_FRAGTEX;
-}
-
-void
-nvfx_init_sampling_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.create_sampler_state = nvfx_sampler_state_create;
- nvfx->pipe.bind_fragment_sampler_states = nvfx_sampler_state_bind;
- nvfx->pipe.delete_sampler_state = nvfx_sampler_state_delete;
- nvfx->pipe.set_fragment_sampler_views = nvfx_set_fragment_sampler_views;
- nvfx->pipe.create_sampler_view = nvfx_create_sampler_view;
- nvfx->pipe.sampler_view_destroy = nvfx_sampler_view_destroy;
-}
-
-#define NV30_3D_TEX_FORMAT_FORMAT_DXT1_RECT NV30_3D_TEX_FORMAT_FORMAT_DXT1
-#define NV30_3D_TEX_FORMAT_FORMAT_DXT3_RECT NV30_3D_TEX_FORMAT_FORMAT_DXT3
-#define NV30_3D_TEX_FORMAT_FORMAT_DXT5_RECT NV30_3D_TEX_FORMAT_FORMAT_DXT5
-
-#define NV40_3D_TEX_FORMAT_FORMAT_HILO16 NV40_3D_TEX_FORMAT_FORMAT_A16L16
-
-#define NV30_3D_TEX_FORMAT_FORMAT_RGBA16F 0x00004a00
-#define NV30_3D_TEX_FORMAT_FORMAT_RGBA16F_RECT NV30_3D_TEX_FORMAT_FORMAT_RGBA16F
-#define NV30_3D_TEX_FORMAT_FORMAT_RGBA32F 0x00004b00
-#define NV30_3D_TEX_FORMAT_FORMAT_RGBA32F_RECT NV30_3D_TEX_FORMAT_FORMAT_RGBA32F
-#define NV30_3D_TEX_FORMAT_FORMAT_R32F 0x00004c00
-#define NV30_3D_TEX_FORMAT_FORMAT_R32F_RECT NV30_3D_TEX_FORMAT_FORMAT_R32F
-
-// TODO: guess!
-#define NV40_3D_TEX_FORMAT_FORMAT_R32F 0x00001c00
-
-#define SRGB 0x00700000
-
-#define __(m,tf,tfc,ts0x,ts0y,ts0z,ts0w,ts1x,ts1y,ts1z,ts1w,sign,wrap) \
-[PIPE_FORMAT_##m] = { \
- {NV30_3D_TEX_FORMAT_FORMAT_##tf, \
- NV30_3D_TEX_FORMAT_FORMAT_##tfc, \
- NV30_3D_TEX_FORMAT_FORMAT_##tf##_RECT, \
- NV30_3D_TEX_FORMAT_FORMAT_##tfc##_RECT, \
- NV40_3D_TEX_FORMAT_FORMAT_##tf, \
- NV40_3D_TEX_FORMAT_FORMAT_##tfc}, \
- sign, wrap, \
- {ts0z, ts0y, ts0x, ts0w, 0, 1}, {ts1z, ts1y, ts1x, ts1w, 0, 0} \
-}
-
-#define _(m,tf,ts0x,ts0y,ts0z,ts0w,ts1x,ts1y,ts1z,ts1w,sign, wrap) \
- __(m,tf,tf,ts0x,ts0y,ts0z,ts0w,ts1x,ts1y,ts1z,ts1w,sign, wrap)
-
-/* Depth formats works by reading the depth value most significant 8/16 bits.
- * We are losing precision, but nVidia loses even more by using A8R8G8B8 instead of HILO16
- * There is no 32-bit integer texture support, so other things are infeasible.
- *
- * TODO: is it possible to read 16 bits for Z16? A16 doesn't seem to work, either due to normalization or endianness issues
- */
-
-#define T 2
-
-#define X 3
-#define Y 2
-#define Z 1
-#define W 0
-
-#define SNORM ((NV30_3D_TEX_FILTER_SIGNED_RED) | (NV30_3D_TEX_FILTER_SIGNED_GREEN) | (NV30_3D_TEX_FILTER_SIGNED_BLUE) | (NV30_3D_TEX_FILTER_SIGNED_ALPHA))
-#define UNORM 0
-
-struct nvfx_texture_format
-nvfx_texture_formats[PIPE_FORMAT_COUNT] = {
- [0 ... PIPE_FORMAT_COUNT - 1] = {{-1, -1, -1, -1, -1, -1}},
- _(B8G8R8X8_UNORM, A8R8G8B8, T, T, T, 1, X, Y, Z, W, UNORM, 0),
- _(B8G8R8X8_SRGB, A8R8G8B8, T, T, T, 1, X, Y, Z, W, UNORM, SRGB),
- _(B8G8R8A8_UNORM, A8R8G8B8, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(B8G8R8A8_SRGB, A8R8G8B8, T, T, T, T, X, Y, Z, W, UNORM, SRGB),
-
- _(R8G8B8A8_UNORM, A8R8G8B8, T, T, T, T, Z, Y, X, W, UNORM, 0),
- _(R8G8B8A8_SRGB, A8R8G8B8, T, T, T, T, Z, Y, X, W, UNORM, SRGB),
- _(R8G8B8X8_UNORM, A8R8G8B8, T, T, T, 1, Z, Y, X, W, UNORM, 0),
-
- _(A8R8G8B8_UNORM, A8R8G8B8, T, T, T, T, W, Z, Y, X, UNORM, 0),
- _(A8R8G8B8_SRGB, A8R8G8B8, T, T, T, T, W, Z, Y, X, UNORM, SRGB),
- _(A8B8G8R8_UNORM, A8R8G8B8, T, T, T, T, W, X, Y, Z, UNORM, 0),
- _(A8B8G8R8_SRGB, A8R8G8B8, T, T, T, T, W, X, Y, Z, UNORM, SRGB),
- _(X8R8G8B8_UNORM, A8R8G8B8, T, T, T, 1, W, Z, Y, X, UNORM, 0),
- _(X8R8G8B8_SRGB, A8R8G8B8, T, T, T, 1, W, Z, Y, X, UNORM, SRGB),
-
- _(B5G5R5A1_UNORM, A1R5G5B5, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(B5G5R5X1_UNORM, A1R5G5B5, T, T, T, 1, X, Y, Z, W, UNORM, 0),
-
- _(B4G4R4A4_UNORM, A4R4G4B4, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(B4G4R4X4_UNORM, A4R4G4B4, T, T, T, 1, X, Y, Z, W, UNORM, 0),
-
- _(B5G6R5_UNORM, R5G6B5, T, T, T, 1, X, Y, Z, W, UNORM, 0),
-
- _(R8_UNORM, L8, T, 0, 0, 1, X, X, X, X, UNORM, 0),
- _(R8_SNORM, L8, T, 0, 0, 1, X, X, X, X, SNORM, 0),
- _(L8_UNORM, L8, T, T, T, 1, X, X, X, X, UNORM, 0),
- _(L8_SRGB, L8, T, T, T, 1, X, X, X, X, UNORM, SRGB),
- _(A8_UNORM, L8, 0, 0, 0, T, X, X, X, X, UNORM, 0),
- _(I8_UNORM, L8, T, T, T, T, X, X, X, X, UNORM, 0),
-
- _(R8G8_UNORM, A8L8, T, T, T, T, X, X, X, W, UNORM, 0),
- _(R8G8_SNORM, A8L8, T, T, T, T, X, X, X, W, SNORM, 0),
- _(L8A8_UNORM, A8L8, T, T, T, T, X, X, X, W, UNORM, 0),
- _(L8A8_SRGB, A8L8, T, T, T, T, X, X, X, W, UNORM, SRGB),
-
- _(DXT1_RGB, DXT1, T, T, T, 1, X, Y, Z, W, UNORM, 0),
- _(DXT1_SRGB, DXT1, T, T, T, 1, X, Y, Z, W, UNORM, SRGB),
- _(DXT1_RGBA, DXT1, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(DXT1_SRGBA, DXT1, T, T, T, T, X, Y, Z, W, UNORM, SRGB),
- _(DXT3_RGBA, DXT3, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(DXT3_SRGBA, DXT3, T, T, T, T, X, Y, Z, W, UNORM, SRGB),
- _(DXT5_RGBA, DXT5, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(DXT5_SRGBA, DXT5, T, T, T, T, X, Y, Z, W, UNORM, SRGB),
-
- __(Z16_UNORM, A8L8, Z16, T, T, T, 1, W, W, W, W, UNORM, 0),
- __(S8_UINT_Z24_UNORM,HILO16,Z24, T, T, T, 1, W, W, W, W, UNORM, 0),
- __(X8Z24_UNORM, HILO16,Z24, T, T, T, 1, W, W, W, W, UNORM, 0),
-
- _(R16_UNORM, A16, T, 0, 0, 1, X, X, X, X, UNORM, 0),
- _(R16_SNORM, A16, T, 0, 0, 1, X, X, X, X, SNORM, 0),
- _(R16G16_UNORM, HILO16, T, T, 0, 1, X, Y, X, X, UNORM, 0),
- _(R16G16_SNORM, HILO16, T, T, 0, 1, X, Y, X, X, SNORM, 0),
-
- _(R16G16B16A16_FLOAT, RGBA16F, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(R32G32B32A32_FLOAT, RGBA32F, T, T, T, T, X, Y, Z, W, UNORM, 0),
- _(R32_FLOAT, R32F, T, 0, 0, 1, X, X, X, X, UNORM, 0)
-};
+++ /dev/null
-#include "pipe/p_state.h"
-#include "pipe/p_defines.h"
-#include "util/u_inlines.h"
-#include "util/u_format.h"
-#include "util/u_memory.h"
-#include "util/u_math.h"
-#include "util/u_staging.h"
-#include "state_tracker/drm_driver.h"
-#include "nouveau/nouveau_winsys.h"
-#include "nouveau/nouveau_screen.h"
-#include "nvfx_screen.h"
-#include "nvfx_resource.h"
-
-static void
-nvfx_miptree_choose_format(struct nvfx_miptree *mt)
-{
- struct pipe_resource *pt = &mt->base.base;
- unsigned uniform_pitch = 0;
- static int no_swizzle = -1;
- if(no_swizzle < 0)
- no_swizzle = debug_get_bool_option("NV40_NO_SWIZZLE", FALSE); /* this will break things on nv30 */
-
- if (!util_is_power_of_two(pt->width0) ||
- !util_is_power_of_two(pt->height0) ||
- !util_is_power_of_two(pt->depth0) ||
- (!nvfx_screen(pt->screen)->is_nv4x && pt->target == PIPE_TEXTURE_RECT)
- )
- uniform_pitch = 1;
-
- if (
- (pt->bind & (PIPE_BIND_SCANOUT | PIPE_BIND_DISPLAY_TARGET))
- || (pt->usage & PIPE_USAGE_DYNAMIC) || (pt->usage & PIPE_USAGE_STAGING)
- || util_format_is_compressed(pt->format)
- || no_swizzle
- )
- mt->base.base.flags |= NOUVEAU_RESOURCE_FLAG_LINEAR;
-
- /* non compressed formats with uniform pitch must be linear, and vice versa */
- if(!util_format_is_s3tc(pt->format)
- && (uniform_pitch || mt->base.base.flags & NOUVEAU_RESOURCE_FLAG_LINEAR))
- {
- mt->base.base.flags |= NOUVEAU_RESOURCE_FLAG_LINEAR;
- uniform_pitch = 1;
- }
-
- if(uniform_pitch)
- {
- mt->linear_pitch = util_format_get_stride(pt->format, pt->width0);
-
- // TODO: this is only a constraint for rendering and not sampling, apparently
- // we may also want this unconditionally
- if(pt->bind & (PIPE_BIND_SAMPLER_VIEW |
- PIPE_BIND_DEPTH_STENCIL |
- PIPE_BIND_RENDER_TARGET |
- PIPE_BIND_DISPLAY_TARGET |
- PIPE_BIND_SCANOUT))
- mt->linear_pitch = align(mt->linear_pitch, 64);
- }
- else
- mt->linear_pitch = 0;
-}
-
-static unsigned
-nvfx_miptree_layout(struct nvfx_miptree *mt)
-{
- struct pipe_resource* pt = &mt->base.base;
- uint offset = 0;
-
- if(!nvfx_screen(pt->screen)->is_nv4x)
- {
- assert(pt->target == PIPE_TEXTURE_RECT
- || (util_is_power_of_two(pt->width0) && util_is_power_of_two(pt->height0)));
- }
-
- for (unsigned l = 0; l <= pt->last_level; l++)
- {
- unsigned size;
- mt->level_offset[l] = offset;
-
- if(mt->linear_pitch)
- size = mt->linear_pitch;
- else
- size = util_format_get_stride(pt->format, u_minify(pt->width0, l));
- size = util_format_get_2d_size(pt->format, size, u_minify(pt->height0, l));
-
- if(pt->target == PIPE_TEXTURE_3D)
- size *= u_minify(pt->depth0, l);
-
- offset += size;
- }
-
- offset = align(offset, 128);
- mt->face_size = offset;
- if(mt->base.base.target == PIPE_TEXTURE_CUBE)
- offset += 5 * mt->face_size;
- return offset;
-}
-
-static void
-nvfx_miptree_surface_final_destroy(struct pipe_surface* ps)
-{
- pipe_resource_reference(&ps->texture, 0);
- FREE(ps);
-}
-
-void
-nvfx_miptree_destroy(struct pipe_screen *screen, struct pipe_resource *pt)
-{
- struct nvfx_miptree *mt = (struct nvfx_miptree *)pt;
- util_surfaces_destroy(&mt->surfaces, pt, nvfx_miptree_surface_final_destroy);
- nouveau_screen_bo_release(screen, mt->base.bo);
- FREE(mt);
-}
-
-static struct nvfx_miptree*
-nvfx_miptree_create_skeleton(struct pipe_screen *pscreen, const struct pipe_resource *pt)
-{
- struct nvfx_miptree *mt;
-
- if(pt->width0 > 4096 || pt->height0 > 4096)
- return NULL;
-
- mt = CALLOC_STRUCT(nvfx_miptree);
- if (!mt)
- return NULL;
-
- mt->base.base = *pt;
-
- pipe_reference_init(&mt->base.base.reference, 1);
- mt->base.base.screen = pscreen;
-
- // set this to the actual capabilities, we use it to decide whether to use the 3D engine for copies
- // TODO: is this the correct way to use Gallium?
- mt->base.base.bind = pt->bind | PIPE_BIND_RENDER_TARGET | PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_DEPTH_STENCIL;
-
- // on our current driver (and the driver too), format support does not depend on geometry, so don't bother computing it
- // TODO: may want to revisit this
- if(!pscreen->is_format_supported(pscreen, pt->format, pt->target, 0, PIPE_BIND_RENDER_TARGET))
- mt->base.base.bind &=~ PIPE_BIND_RENDER_TARGET;
- if(!pscreen->is_format_supported(pscreen, pt->format, pt->target, 0, PIPE_BIND_SAMPLER_VIEW))
- mt->base.base.bind &=~ PIPE_BIND_SAMPLER_VIEW;
- if(!pscreen->is_format_supported(pscreen, pt->format, pt->target, 0, PIPE_BIND_DEPTH_STENCIL))
- mt->base.base.bind &=~ PIPE_BIND_DEPTH_STENCIL;
-
- return mt;
-}
-
-
-struct pipe_resource *
-nvfx_miptree_create(struct pipe_screen *pscreen, const struct pipe_resource *pt)
-{
- struct nvfx_miptree* mt = nvfx_miptree_create_skeleton(pscreen, pt);
- unsigned size;
- nvfx_miptree_choose_format(mt);
-
- size = nvfx_miptree_layout(mt);
-
- mt->base.bo = nouveau_screen_bo_new(pscreen, 256, pt->usage, pt->bind, size);
-
- if (!mt->base.bo) {
- FREE(mt);
- return NULL;
- }
- return &mt->base.base;
-}
-
-// TODO: redo this, just calling miptree_layout
-struct pipe_resource *
-nvfx_miptree_from_handle(struct pipe_screen *pscreen, const struct pipe_resource *template, struct winsys_handle *whandle)
-{
- struct nvfx_miptree* mt = nvfx_miptree_create_skeleton(pscreen, template);
- unsigned stride;
- if(whandle->stride) {
- mt->linear_pitch = whandle->stride;
- mt->base.base.flags |= NOUVEAU_RESOURCE_FLAG_LINEAR;
- } else
- nvfx_miptree_choose_format(mt);
-
- nvfx_miptree_layout(mt);
-
- mt->base.bo = nouveau_screen_bo_from_handle(pscreen, whandle, &stride);
- if (mt->base.bo == NULL) {
- FREE(mt);
- return NULL;
- }
- return &mt->base.base;
-}
-
-struct pipe_surface *
-nvfx_miptree_surface_new(struct pipe_context *pipe, struct pipe_resource *pt,
- const struct pipe_surface *surf_tmpl)
-{
- struct nvfx_miptree *mt = (struct nvfx_miptree *)pt;
- unsigned level = surf_tmpl->u.tex.level;
- struct nvfx_surface *ns = NULL;
-
- assert(surf_tmpl->u.tex.first_layer == surf_tmpl->u.tex.last_layer);
- if(util_surfaces_get(&mt->surfaces, sizeof(struct nvfx_surface), pipe,
- pt, level, surf_tmpl->u.tex.first_layer,
- surf_tmpl->usage, (struct pipe_surface **)&ns)) {
- ns->pitch = nvfx_subresource_pitch(pt, level);
- ns->offset = nvfx_subresource_offset(pt, surf_tmpl->u.tex.first_layer, level, surf_tmpl->u.tex.first_layer);
- }
-
- return &ns->base;
-}
-
-void
-nvfx_miptree_surface_del(struct pipe_context *pipe, struct pipe_surface *ps)
-{
- util_surfaces_detach(&((struct nvfx_miptree*)ps->texture)->surfaces, ps);
- pipe_resource_reference(&ps->texture, 0);
- FREE(ps);
-}
+++ /dev/null
-#include "pipe/p_context.h"
-#include "pipe/p_state.h"
-#include "util/u_inlines.h"
-#include "util/u_format.h"
-#include "util/u_split_prim.h"
-#include "translate/translate.h"
-
-#include "nvfx_context.h"
-#include "nvfx_resource.h"
-
-struct push_context {
- struct nouveau_channel* chan;
- struct nouveau_grobj *eng3d;
-
- void *idxbuf;
- int32_t idxbias;
-
- float edgeflag;
- int edgeflag_attr;
-
- unsigned vertex_length;
- unsigned max_vertices_per_packet;
-
- struct translate* translate;
-};
-
-static void
-emit_edgeflag(void *priv, boolean enabled)
-{
- struct push_context* ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- struct nouveau_channel *chan = ctx->chan;
-
- BEGIN_RING(chan, eng3d, NV30_3D_EDGEFLAG, 1);
- OUT_RING(chan, enabled ? 1 : 0);
-}
-
-static void
-emit_vertices_lookup8(void *priv, unsigned start, unsigned count)
-{
- struct push_context *ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- uint8_t* elts = (uint8_t*)ctx->idxbuf + start;
-
- while(count)
- {
- unsigned push = MIN2(count, ctx->max_vertices_per_packet);
- unsigned length = push * ctx->vertex_length;
-
- BEGIN_RING_NI(ctx->chan, eng3d, NV30_3D_VERTEX_DATA, length);
- ctx->translate->run_elts8(ctx->translate, elts, push, 0, ctx->chan->cur);
- ctx->chan->cur += length;
-
- count -= push;
- elts += push;
- }
-}
-
-static void
-emit_vertices_lookup16(void *priv, unsigned start, unsigned count)
-{
- struct push_context *ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- uint16_t* elts = (uint16_t*)ctx->idxbuf + start;
-
- while(count)
- {
- unsigned push = MIN2(count, ctx->max_vertices_per_packet);
- unsigned length = push * ctx->vertex_length;
-
- BEGIN_RING_NI(ctx->chan, eng3d, NV30_3D_VERTEX_DATA, length);
- ctx->translate->run_elts16(ctx->translate, elts, push, 0, ctx->chan->cur);
- ctx->chan->cur += length;
-
- count -= push;
- elts += push;
- }
-}
-
-static void
-emit_vertices_lookup32(void *priv, unsigned start, unsigned count)
-{
- struct push_context *ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- uint32_t* elts = (uint32_t*)ctx->idxbuf + start;
-
- while(count)
- {
- unsigned push = MIN2(count, ctx->max_vertices_per_packet);
- unsigned length = push * ctx->vertex_length;
-
- BEGIN_RING_NI(ctx->chan, eng3d, NV30_3D_VERTEX_DATA, length);
- ctx->translate->run_elts(ctx->translate, elts, push, 0, ctx->chan->cur);
- ctx->chan->cur += length;
-
- count -= push;
- elts += push;
- }
-}
-
-static void
-emit_vertices(void *priv, unsigned start, unsigned count)
-{
- struct push_context *ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
-
- while(count)
- {
- unsigned push = MIN2(count, ctx->max_vertices_per_packet);
- unsigned length = push * ctx->vertex_length;
-
- BEGIN_RING_NI(ctx->chan, eng3d, NV30_3D_VERTEX_DATA, length);
- ctx->translate->run(ctx->translate, start, push, 0, ctx->chan->cur);
- ctx->chan->cur += length;
-
- count -= push;
- start += push;
- }
-}
-
-static void
-emit_ranges(void* priv, unsigned start, unsigned vc, unsigned reg)
-{
- struct push_context* ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- struct nouveau_channel *chan = ctx->chan;
- unsigned nr = (vc & 0xff);
- if (nr) {
- BEGIN_RING(chan, eng3d, reg, 1);
- OUT_RING (chan, ((nr - 1) << 24) | start);
- start += nr;
- }
-
- nr = vc >> 8;
- while (nr) {
- unsigned push = nr > 2047 ? 2047 : nr;
-
- nr -= push;
-
- BEGIN_RING_NI(chan, eng3d, reg, push);
- while (push--) {
- OUT_RING(chan, ((0x100 - 1) << 24) | start);
- start += 0x100;
- }
- }
-}
-
-static void
-emit_ib_ranges(void* priv, unsigned start, unsigned vc)
-{
- emit_ranges(priv, start, vc, NV30_3D_VB_INDEX_BATCH);
-}
-
-static void
-emit_vb_ranges(void* priv, unsigned start, unsigned vc)
-{
- emit_ranges(priv, start, vc, NV30_3D_VB_VERTEX_BATCH);
-}
-
-static INLINE void
-emit_elt8(void* priv, unsigned start, unsigned vc)
-{
- struct push_context* ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- struct nouveau_channel *chan = ctx->chan;
- uint8_t *elts = (uint8_t *)ctx->idxbuf + start;
- int idxbias = ctx->idxbias;
-
- if (vc & 1) {
- BEGIN_RING(chan, eng3d, NV30_3D_VB_ELEMENT_U32, 1);
- OUT_RING (chan, elts[0]);
- elts++; vc--;
- }
-
- while (vc) {
- unsigned i;
- unsigned push = MIN2(vc, 2047 * 2);
-
- BEGIN_RING_NI(chan, eng3d, NV30_3D_VB_ELEMENT_U16, push >> 1);
- for (i = 0; i < push; i+=2)
- OUT_RING(chan, ((elts[i+1] + idxbias) << 16) | (elts[i] + idxbias));
-
- vc -= push;
- elts += push;
- }
-}
-
-static INLINE void
-emit_elt16(void* priv, unsigned start, unsigned vc)
-{
- struct push_context* ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- struct nouveau_channel *chan = ctx->chan;
- uint16_t *elts = (uint16_t *)ctx->idxbuf + start;
- int idxbias = ctx->idxbias;
-
- if (vc & 1) {
- BEGIN_RING(chan, eng3d, NV30_3D_VB_ELEMENT_U32, 1);
- OUT_RING (chan, elts[0]);
- elts++; vc--;
- }
-
- while (vc) {
- unsigned i;
- unsigned push = MIN2(vc, 2047 * 2);
-
- BEGIN_RING_NI(chan, eng3d, NV30_3D_VB_ELEMENT_U16, push >> 1);
- for (i = 0; i < push; i+=2)
- OUT_RING(chan, ((elts[i+1] + idxbias) << 16) | (elts[i] + idxbias));
-
- vc -= push;
- elts += push;
- }
-}
-
-static INLINE void
-emit_elt32(void* priv, unsigned start, unsigned vc)
-{
- struct push_context* ctx = priv;
- struct nouveau_grobj *eng3d = ctx->eng3d;
- struct nouveau_channel *chan = ctx->chan;
- uint32_t *elts = (uint32_t *)ctx->idxbuf + start;
- int idxbias = ctx->idxbias;
-
- while (vc) {
- unsigned push = MIN2(vc, 2047);
-
- BEGIN_RING_NI(chan, eng3d, NV30_3D_VB_ELEMENT_U32, push);
- if(idxbias)
- {
- for(unsigned i = 0; i < push; ++i)
- OUT_RING(chan, elts[i] + idxbias);
- }
- else
- OUT_RINGp(chan, elts, push);
-
- vc -= push;
- elts += push;
- }
-}
-
-void
-nvfx_push_vbo(struct pipe_context *pipe, const struct pipe_draw_info *info)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct push_context ctx;
- struct util_split_prim s;
- unsigned instances_left = info->instance_count;
- int vtx_value;
- unsigned hw_mode = nvgl_primitive(info->mode);
- int i;
- struct
- {
- uint8_t* map;
- unsigned step;
- } per_instance[16];
- unsigned p_overhead = 64 /* magic fix */
- + 4 /* begin/end */
- + 4; /* potential edgeflag enable/disable */
-
- ctx.chan = nvfx->screen->base.channel;
- ctx.eng3d = nvfx->screen->eng3d;
- ctx.translate = nvfx->vtxelt->translate;
- ctx.idxbuf = NULL;
- ctx.vertex_length = nvfx->vtxelt->vertex_length;
- ctx.max_vertices_per_packet = nvfx->vtxelt->max_vertices_per_packet;
- ctx.edgeflag = 0.5f;
- // TODO: figure out if we really want to handle this, and do so in that case
- ctx.edgeflag_attr = 0xff; // nvfx->vertprog->cfg.edgeflag_in;
-
- if(!nvfx->use_vertex_buffers)
- {
- for(i = 0; i < nvfx->vtxelt->num_per_vertex_buffer_infos; ++i)
- {
- struct nvfx_per_vertex_buffer_info* vbi = &nvfx->vtxelt->per_vertex_buffer_info[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[vbi->vertex_buffer_index];
- uint8_t* data = nvfx_buffer(vb->buffer)->data + vb->buffer_offset;
- if(info->indexed)
- data += info->index_bias * vb->stride;
- ctx.translate->set_buffer(ctx.translate, i, data, vb->stride, ~0);
- }
-
- if(ctx.edgeflag_attr < 16)
- vtx_value = -(ctx.vertex_length + 3); /* vertex data and edgeflag header and value */
- else
- {
- p_overhead += 1; /* initial vertex_data header */
- vtx_value = -ctx.vertex_length; /* vertex data and edgeflag header and value */
- }
-
- if (info->indexed) {
- // XXX: this case and is broken and probably need a new VTX_ATTR push path
- if (nvfx->idxbuf.index_size == 1)
- s.emit = emit_vertices_lookup8;
- else if (nvfx->idxbuf.index_size == 2)
- s.emit = emit_vertices_lookup16;
- else
- s.emit = emit_vertices_lookup32;
- } else
- s.emit = emit_vertices;
- }
- else
- {
- if(!info->indexed || nvfx->use_index_buffer)
- {
- s.emit = info->indexed ? emit_ib_ranges : emit_vb_ranges;
- p_overhead += 3;
- vtx_value = 0;
- }
- else if (nvfx->idxbuf.index_size == 4)
- {
- s.emit = emit_elt32;
- p_overhead += 1;
- vtx_value = 8;
- }
- else
- {
- s.emit = (nvfx->idxbuf.index_size == 2) ? emit_elt16 : emit_elt8;
- p_overhead += 3;
- vtx_value = 7;
- }
- }
-
- ctx.idxbias = info->index_bias;
- if(nvfx->use_vertex_buffers)
- ctx.idxbias -= nvfx->base_vertex;
-
- /* map index buffer, if present */
- if (info->indexed && !nvfx->use_index_buffer)
- ctx.idxbuf = nvfx_buffer(nvfx->idxbuf.buffer)->data + nvfx->idxbuf.offset;
-
- s.priv = &ctx;
- s.edge = emit_edgeflag;
-
- for (i = 0; i < nvfx->vtxelt->num_per_instance; ++i)
- {
- struct nvfx_per_instance_element *ve = &nvfx->vtxelt->per_instance[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[ve->base.vertex_buffer_index];
- float v[4];
- per_instance[i].step = info->start_instance % ve->instance_divisor;
- per_instance[i].map = nvfx_buffer(vb->buffer)->data + vb->buffer_offset + ve->base.src_offset;
-
- nvfx->vtxelt->per_instance[i].base.fetch_rgba_float(v, per_instance[i].map, 0, 0);
-
- nvfx_emit_vtx_attr(chan, eng3d,
- nvfx->vtxelt->per_instance[i].base.idx, v,
- nvfx->vtxelt->per_instance[i].base.ncomp);
- }
-
- /* per-instance loop */
- while (instances_left--) {
- int max_verts;
- boolean done;
-
- util_split_prim_init(&s, info->mode, info->start, info->count);
- nvfx_state_emit(nvfx);
- for(;;) {
- max_verts = AVAIL_RING(chan);
- max_verts -= p_overhead;
-
- /* if vtx_value < 0, each vertex is -vtx_value words long
- * otherwise, each vertex is 2^(vtx_value) / 255 words long (this is an approximation)
- */
- if(vtx_value < 0)
- {
- max_verts /= -vtx_value;
- max_verts -= (max_verts >> 10); /* vertex data headers */
- }
- else
- {
- if(max_verts >= (1 << 23)) /* avoid overflow here */
- max_verts = (1 << 23);
- max_verts = (max_verts * 255) >> vtx_value;
- }
-
- //printf("avail %u max_verts %u\n", AVAIL_RING(chan), max_verts);
-
- if(max_verts >= 16)
- {
- /* XXX: any command a lot of times seems to (mostly) fix corruption that would otherwise happen */
- /* this seems to cause issues on nv3x, and also be unneeded there */
- if(nvfx->is_nv4x)
- {
- int i;
- for(i = 0; i < 32; ++i)
- {
- BEGIN_RING(chan, eng3d,
- 0x1dac, 1);
- OUT_RING(chan, 0);
- }
- }
-
- BEGIN_RING(chan, eng3d,
- NV30_3D_VERTEX_BEGIN_END, 1);
- OUT_RING(chan, hw_mode);
- done = util_split_prim_next(&s, max_verts);
- BEGIN_RING(chan, eng3d,
- NV30_3D_VERTEX_BEGIN_END, 1);
- OUT_RING(chan, 0);
-
- if(done)
- break;
- }
-
- FIRE_RING(chan);
- nvfx_state_emit(nvfx);
- }
-
- /* set data for the next instance, if any changed */
- for (i = 0; i < nvfx->vtxelt->num_per_instance; ++i)
- {
- struct nvfx_per_instance_element *ve = &nvfx->vtxelt->per_instance[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[ve->base.vertex_buffer_index];
-
- if(++per_instance[i].step == ve->instance_divisor)
- {
- float v[4];
- per_instance[i].map += vb->stride;
- per_instance[i].step = 0;
-
- nvfx->vtxelt->per_instance[i].base.fetch_rgba_float(v, per_instance[i].map, 0, 0);
- nvfx_emit_vtx_attr(chan, eng3d,
- nvfx->vtxelt->per_instance[i].base.idx,
- v,
- nvfx->vtxelt->per_instance[i].base.ncomp);
- }
- }
- }
-}
+++ /dev/null
-#include "pipe/p_context.h"
-
-#include "nvfx_context.h"
-
-struct nvfx_query {
- struct list_head list;
- struct nouveau_resource *object;
- unsigned type;
- boolean ready;
- uint64_t result;
-};
-
-static INLINE struct nvfx_query *
-nvfx_query(struct pipe_query *pipe)
-{
- return (struct nvfx_query *)pipe;
-}
-
-static struct pipe_query *
-nvfx_query_create(struct pipe_context *pipe, unsigned query_type)
-{
- struct nvfx_query *q;
-
- q = CALLOC(1, sizeof(struct nvfx_query));
- q->type = query_type;
-
- assert(q->type == PIPE_QUERY_OCCLUSION_COUNTER);
-
- return (struct pipe_query *)q;
-}
-
-static void
-nvfx_query_destroy(struct pipe_context *pipe, struct pipe_query *pq)
-{
- struct nvfx_query *q = nvfx_query(pq);
-
- if (q->object)
- {
- nouveau_resource_free(&q->object);
- LIST_DEL(&q->list);
- }
- FREE(q);
-}
-
-static void
-nvfx_query_begin(struct pipe_context *pipe, struct pipe_query *pq)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_query *q = nvfx_query(pq);
- struct nvfx_screen *screen = nvfx->screen;
- struct nouveau_channel *chan = screen->base.channel;
- struct nouveau_grobj *eng3d = screen->eng3d;
- uint64_t tmp;
-
- assert(!nvfx->query);
-
- /* Happens when end_query() is called, then another begin_query()
- * without querying the result in-between. For now we'll wait for
- * the existing query to notify completion, but it could be better.
- */
- if (q->object)
- pipe->get_query_result(pipe, pq, 1, (void*)&tmp);
-
- while (nouveau_resource_alloc(nvfx->screen->query_heap, 1, NULL, &q->object))
- {
- struct nvfx_query* oldestq;
- assert(!LIST_IS_EMPTY(&nvfx->screen->query_list));
- oldestq = LIST_ENTRY(struct nvfx_query, nvfx->screen->query_list.next, list);
- pipe->get_query_result(pipe, (struct pipe_query*)oldestq, 1, (void*)&tmp);
- }
-
- LIST_ADDTAIL(&q->list, &nvfx->screen->query_list);
-
- nouveau_notifier_reset(nvfx->screen->query, q->object->start);
-
- BEGIN_RING(chan, eng3d, NV30_3D_QUERY_RESET, 1);
- OUT_RING(chan, 1);
- BEGIN_RING(chan, eng3d, NV30_3D_QUERY_ENABLE, 1);
- OUT_RING(chan, 1);
-
- q->ready = FALSE;
-
- nvfx->query = pq;
-}
-
-static void
-nvfx_query_end(struct pipe_context *pipe, struct pipe_query *pq)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct nvfx_query *q = nvfx_query(pq);
-
- assert(nvfx->query == pq);
-
- BEGIN_RING(chan, eng3d, NV30_3D_QUERY_GET, 1);
- OUT_RING (chan, (0x01 << NV30_3D_QUERY_GET_UNK24__SHIFT) |
- ((q->object->start * 32) << NV30_3D_QUERY_GET_OFFSET__SHIFT));
- BEGIN_RING(chan, eng3d, NV30_3D_QUERY_ENABLE, 1);
- OUT_RING(chan, 0);
- FIRE_RING(chan);
-
- nvfx->query = 0;
-}
-
-static boolean
-nvfx_query_result(struct pipe_context *pipe, struct pipe_query *pq,
- boolean wait, union pipe_query_result *vresult)
-{
- uint64_t *result = (uint64_t *)vresult;
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_query *q = nvfx_query(pq);
-
- if (!q->ready) {
- unsigned status;
-
- status = nouveau_notifier_status(nvfx->screen->query,
- q->object->start);
- if (status != NV_NOTIFY_STATE_STATUS_COMPLETED) {
- if (wait == FALSE)
- return FALSE;
-
- nouveau_notifier_wait_status(nvfx->screen->query,
- q->object->start,
- NV_NOTIFY_STATE_STATUS_COMPLETED, 0);
- }
-
- q->result = nouveau_notifier_return_val(nvfx->screen->query,
- q->object->start);
- q->ready = TRUE;
- nouveau_resource_free(&q->object);
- LIST_DEL(&q->list);
- }
-
- *result = q->result;
- return TRUE;
-}
-
-void
-nvfx_init_query_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.create_query = nvfx_query_create;
- nvfx->pipe.destroy_query = nvfx_query_destroy;
- nvfx->pipe.begin_query = nvfx_query_begin;
- nvfx->pipe.end_query = nvfx_query_end;
- nvfx->pipe.get_query_result = nvfx_query_result;
-}
+++ /dev/null
-
-#include "pipe/p_context.h"
-#include "util/u_staging.h"
-#include "nvfx_resource.h"
-#include "nouveau/nouveau_screen.h"
-
-
-static struct pipe_resource *
-nvfx_resource_create(struct pipe_screen *screen,
- const struct pipe_resource *template)
-{
- if (template->target == PIPE_BUFFER)
- return nvfx_buffer_create(screen, template);
- else
- return nvfx_miptree_create(screen, template);
-}
-
-static void
-nvfx_resource_destroy(struct pipe_screen *screen, struct pipe_resource *pr)
-{
- if (pr->target == PIPE_BUFFER)
- return nvfx_buffer_destroy(screen, pr);
- else
- return nvfx_miptree_destroy(screen, pr);
-}
-
-static struct pipe_resource *
-nvfx_resource_from_handle(struct pipe_screen * screen,
- const struct pipe_resource *template,
- struct winsys_handle *whandle)
-{
- if (template->target == PIPE_BUFFER)
- return NULL;
- else
- return nvfx_miptree_from_handle(screen, template, whandle);
-}
-
-static boolean
-nvfx_resource_get_handle(struct pipe_screen *pscreen,
- struct pipe_resource *pr,
- struct winsys_handle *whandle)
-{
- struct nvfx_resource* res = (struct nvfx_resource*)pr;
-
- if (!res || !res->bo)
- return FALSE;
-
- return nouveau_screen_bo_get_handle(pscreen, res->bo, nvfx_subresource_pitch(pr, 0), whandle);
-}
-
-void
-nvfx_init_resource_functions(struct pipe_context *pipe)
-{
- pipe->create_surface = nvfx_miptree_surface_new;
- pipe->surface_destroy = nvfx_miptree_surface_del;
-}
-
-void
-nvfx_screen_init_resource_functions(struct pipe_screen *pscreen)
-{
- pscreen->resource_create = nvfx_resource_create;
- pscreen->resource_from_handle = nvfx_resource_from_handle;
- pscreen->resource_get_handle = nvfx_resource_get_handle;
- pscreen->resource_destroy = nvfx_resource_destroy;
- pscreen->user_buffer_create = nvfx_user_buffer_create;
-}
+++ /dev/null
-#ifndef NVFX_RESOURCE_H
-#define NVFX_RESOURCE_H
-
-#include "util/u_transfer.h"
-#include "util/u_format.h"
-#include "util/u_math.h"
-#include "util/u_double_list.h"
-#include "util/u_surfaces.h"
-#include "util/u_dirty_surfaces.h"
-#include <nouveau/nouveau_bo.h>
-
-struct pipe_resource;
-struct nv04_region;
-
-struct nvfx_resource {
- struct pipe_resource base;
- struct nouveau_bo *bo;
-};
-
-static INLINE
-struct nvfx_resource *nvfx_resource(struct pipe_resource *resource)
-{
- return (struct nvfx_resource *)resource;
-}
-
-#define NVFX_RESOURCE_FLAG_USER (NOUVEAU_RESOURCE_FLAG_DRV_PRIV << 0)
-
-/* is resource mapped into the GPU's address space (i.e. VRAM or GART) ? */
-static INLINE boolean
-nvfx_resource_mapped_by_gpu(struct pipe_resource *resource)
-{
- return nvfx_resource(resource)->bo->handle;
-}
-
-/* is resource in VRAM? */
-static inline int
-nvfx_resource_on_gpu(struct pipe_resource* pr)
-{
-#if 0
- // a compiler error here means you need to apply libdrm-nouveau-add-domain.patch to libdrm
- // TODO: return FALSE if not VRAM and on a PCI-E system
- return ((struct nvfx_resource*)pr)->bo->domain & (NOUVEAU_BO_VRAM | NOUVEAU_BO_GART);
-#else
- return TRUE;
-#endif
-}
-
-#define NVFX_MAX_TEXTURE_LEVELS 16
-
-struct nvfx_miptree {
- struct nvfx_resource base;
-
- unsigned linear_pitch; /* for linear textures, 0 for swizzled and compressed textures with level-dependent minimal pitch */
- unsigned face_size; /* 128-byte aligned face/total size */
- unsigned level_offset[NVFX_MAX_TEXTURE_LEVELS];
-
- struct util_surfaces surfaces;
-};
-
-struct nvfx_surface {
- struct pipe_surface base;
- unsigned pitch;
- unsigned offset;
-};
-
-static INLINE struct nouveau_bo *
-nvfx_surface_buffer(struct pipe_surface *surf)
-{
- struct nvfx_resource *mt = nvfx_resource(surf->texture);
-
- return mt->bo;
-}
-
-void
-nvfx_init_resource_functions(struct pipe_context *pipe);
-
-void
-nvfx_screen_init_resource_functions(struct pipe_screen *pscreen);
-
-
-/* Internal:
- */
-
-struct pipe_resource *
-nvfx_miptree_create(struct pipe_screen *pscreen, const struct pipe_resource *pt);
-
-void
-nvfx_miptree_destroy(struct pipe_screen *pscreen,
- struct pipe_resource *presource);
-
-struct pipe_resource *
-nvfx_miptree_from_handle(struct pipe_screen *pscreen,
- const struct pipe_resource *template,
- struct winsys_handle *whandle);
-
-void
-nvfx_miptree_surface_del(struct pipe_context *pipe, struct pipe_surface *ps);
-
-struct pipe_surface *
-nvfx_miptree_surface_new(struct pipe_context *pipe, struct pipe_resource *pt,
- const struct pipe_surface *surf_tmpl);
-
-/* only for miptrees, don't use for buffers */
-
-/* NOTE: for swizzled 3D textures, this just returns the offset of the mipmap level */
-static inline unsigned
-nvfx_subresource_offset(struct pipe_resource* pt, unsigned face, unsigned level, unsigned zslice)
-{
- if(pt->target == PIPE_BUFFER)
- return 0;
- else
- {
- struct nvfx_miptree *mt = (struct nvfx_miptree *)pt;
-
- unsigned offset = mt->level_offset[level];
- if (pt->target == PIPE_TEXTURE_CUBE)
- offset += mt->face_size * face;
- else if (pt->target == PIPE_TEXTURE_3D && mt->linear_pitch)
- offset += zslice * util_format_get_2d_size(pt->format, (mt->linear_pitch ? mt->linear_pitch : util_format_get_stride(pt->format, u_minify(pt->width0, level))), u_minify(pt->height0, level));
- return offset;
- }
-}
-
-static inline unsigned
-nvfx_subresource_pitch(struct pipe_resource* pt, unsigned level)
-{
- if(pt->target == PIPE_BUFFER)
- return ((struct nvfx_resource*)pt)->bo->size;
- else
- {
- struct nvfx_miptree *mt = (struct nvfx_miptree *)pt;
-
- if(mt->linear_pitch)
- return mt->linear_pitch;
- else
- return util_format_get_stride(pt->format, u_minify(pt->width0, level));
- }
-}
-
-struct nvfx_buffer
-{
- struct nvfx_resource base;
- uint8_t* data;
- unsigned size;
-
- /* the range of data not yet uploaded to the GPU bo */
- unsigned dirty_begin;
- unsigned dirty_end;
-
- /* whether all transfers were unsynchronized */
- boolean dirty_unsynchronized;
-
- /* whether it would have been profitable to upload
- * the latest updated data to the GPU immediately */
- boolean last_update_static;
-
- /* how many bytes we need to draw before we deem
- * the buffer to be static
- */
- long long bytes_to_draw_until_static;
-};
-
-static inline struct nvfx_buffer* nvfx_buffer(struct pipe_resource* pr)
-{
- return (struct nvfx_buffer*)pr;
-}
-
-/* this is an heuristic to determine whether we are better off uploading the
- * buffer to the GPU, or just continuing pushing it on the FIFO
- */
-static inline boolean nvfx_buffer_seems_static(struct nvfx_buffer* buffer)
-{
- return buffer->last_update_static
- || buffer->bytes_to_draw_until_static < 0;
-}
-
-struct pipe_resource *
-nvfx_buffer_create(struct pipe_screen *pscreen,
- const struct pipe_resource *template);
-
-void
-nvfx_buffer_destroy(struct pipe_screen *pscreen,
- struct pipe_resource *presource);
-
-struct pipe_resource *
-nvfx_user_buffer_create(struct pipe_screen *screen,
- void *ptr,
- unsigned bytes,
- unsigned usage);
-
-void
-nvfx_buffer_upload(struct nvfx_buffer* buffer);
-
-#endif
+++ /dev/null
-#include "pipe/p_screen.h"
-#include "pipe/p_state.h"
-#include "util/u_format.h"
-#include "util/u_format_s3tc.h"
-#include "vl/vl_decoder.h"
-#include "vl/vl_video_buffer.h"
-
-#include "nouveau/nouveau_screen.h"
-#include "nouveau/nv_object.xml.h"
-#include "nvfx_context.h"
-#include "nvfx_screen.h"
-#include "nvfx_resource.h"
-#include "nvfx_tex.h"
-
-#define NV30_3D_CHIPSET_3X_MASK 0x00000003
-#define NV34_3D_CHIPSET_3X_MASK 0x00000010
-#define NV35_3D_CHIPSET_3X_MASK 0x000001e0
-
-#define NV4X_GRCLASS4097_CHIPSETS 0x00000baf
-#define NV4X_GRCLASS4497_CHIPSETS 0x00005450
-#define NV6X_GRCLASS4497_CHIPSETS 0x00000088
-
-static int
-nvfx_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
-{
- struct nvfx_screen *screen = nvfx_screen(pscreen);
-
- switch (param) {
- case PIPE_CAP_NPOT_TEXTURES:
- return screen->advertise_npot;
- case PIPE_CAP_TWO_SIDED_STENCIL:
- return 1;
- case PIPE_CAP_SM3:
- /* TODO: >= nv4x support Shader Model 3.0 */
- return 0;
- case PIPE_CAP_GLSL_FEATURE_LEVEL:
- return 120;
- case PIPE_CAP_ANISOTROPIC_FILTER:
- return 1;
- case PIPE_CAP_POINT_SPRITE:
- return 1;
- case PIPE_CAP_MAX_RENDER_TARGETS:
- return screen->use_nv4x ? 4 : 1;
- case PIPE_CAP_OCCLUSION_QUERY:
- return 1;
- case PIPE_CAP_TIMER_QUERY:
- return 0;
- case PIPE_CAP_TEXTURE_SHADOW_MAP:
- return 1;
- case PIPE_CAP_TEXTURE_SWIZZLE:
- return 1;
- case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
- return 13;
- case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
- return 10;
- case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
- return 13;
- case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
- return !!screen->use_nv4x;
- case PIPE_CAP_BLEND_EQUATION_SEPARATE:
- return screen->advertise_blend_equation_separate;
- case PIPE_CAP_MAX_COMBINED_SAMPLERS:
- return 16;
- case PIPE_CAP_INDEP_BLEND_ENABLE:
- /* TODO: on nv40 we have separate color masks */
- /* TODO: nv40 mrt blending is probably broken */
- return 0;
- case PIPE_CAP_INDEP_BLEND_FUNC:
- return 0;
- case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
- return 0;
- case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
- case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
- case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
- case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
- case PIPE_CAP_VERTEX_COLOR_CLAMPED:
- return 1;
- case PIPE_CAP_DEPTH_CLIP_DISABLE:
- return 0; // TODO: implement depth clamp
- case PIPE_CAP_PRIMITIVE_RESTART:
- return 0; // TODO: implement primitive restart
- case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
- case PIPE_CAP_TGSI_INSTANCEID:
- case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
- case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
- case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
- case PIPE_CAP_SEAMLESS_CUBE_MAP:
- case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
- case PIPE_CAP_SHADER_STENCIL_EXPORT:
- case PIPE_CAP_MIN_TEXEL_OFFSET:
- case PIPE_CAP_MAX_TEXEL_OFFSET:
- case PIPE_CAP_CONDITIONAL_RENDER:
- case PIPE_CAP_TEXTURE_BARRIER:
- case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
- case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
- case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
- case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
- case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS:
- case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
- case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
- return 0;
- default:
- NOUVEAU_ERR("Warning: unknown PIPE_CAP %d\n", param);
- return 0;
- }
-}
-
-static int
-nvfx_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader, enum pipe_shader_cap param)
-{
- struct nvfx_screen *screen = nvfx_screen(pscreen);
-
- switch(shader) {
- case PIPE_SHADER_FRAGMENT:
- switch(param) {
- case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
- case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
- case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
- case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
- return 4096;
- case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
- /* FIXME: is it the dynamic (nv30:0/nv40:24) or the static
- value (nv30:0/nv40:4) ? */
- return screen->use_nv4x ? 4 : 0;
- case PIPE_SHADER_CAP_MAX_INPUTS:
- return screen->use_nv4x ? 12 : 10;
- case PIPE_SHADER_CAP_MAX_CONSTS:
- return screen->use_nv4x ? 224 : 32;
- case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
- return 1;
- case PIPE_SHADER_CAP_MAX_TEMPS:
- return 32;
- case PIPE_SHADER_CAP_MAX_ADDRS:
- return screen->use_nv4x ? 1 : 0;
- case PIPE_SHADER_CAP_MAX_PREDS:
- return 0; /* we could expose these, but nothing uses them */
- case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
- return 0;
- case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
- case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
- case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
- case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
- return 0;
- case PIPE_SHADER_CAP_SUBROUTINES:
- return screen->use_nv4x ? 1 : 0;
- case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
- return 16;
- default:
- break;
- }
- break;
- case PIPE_SHADER_VERTEX:
- switch(param) {
- case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
- case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
- return screen->use_nv4x ? 512 : 256;
- case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
- case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
- return screen->use_nv4x ? 512 : 0;
- case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
- /* FIXME: is it the dynamic (nv30:24/nv40:24) or the static
- value (nv30:1/nv40:4) ? */
- return screen->use_nv4x ? 4 : 1;
- case PIPE_SHADER_CAP_MAX_INPUTS:
- return 16;
- case PIPE_SHADER_CAP_MAX_CONSTS:
- /* - 6 is for clip planes; Gallium should be fixed to put
- * them in the vertex shader itself, so we don't need to reserve these */
- return (screen->use_nv4x ? 468 : 256) - 6;
- case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
- return 1;
- case PIPE_SHADER_CAP_MAX_TEMPS:
- return screen->use_nv4x ? 32 : 13;
- case PIPE_SHADER_CAP_MAX_ADDRS:
- return 2;
- case PIPE_SHADER_CAP_MAX_PREDS:
- return 0; /* we could expose these, but nothing uses them */
- case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
- return 1;
- case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
- case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
- case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
- return 0;
- case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
- return 1;
- case PIPE_SHADER_CAP_SUBROUTINES:
- return 1;
- case PIPE_SHADER_CAP_INTEGERS:
- return 0;
- case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
- return 0; /* We have 4 on nv40 - but unsupported currently */
- default:
- break;
- }
- break;
- default:
- break;
- }
- return 0;
-}
-
-static float
-nvfx_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
-{
- struct nvfx_screen *screen = nvfx_screen(pscreen);
-
- switch (param) {
- case PIPE_CAPF_MAX_LINE_WIDTH:
- case PIPE_CAPF_MAX_LINE_WIDTH_AA:
- return 10.0;
- case PIPE_CAPF_MAX_POINT_WIDTH:
- case PIPE_CAPF_MAX_POINT_WIDTH_AA:
- return 64.0;
- case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
- return screen->use_nv4x ? 16.0 : 8.0;
- case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
- return 15.0;
- default:
- NOUVEAU_ERR("Unknown PIPE_CAP %d\n", param);
- return 0.0;
- }
-}
-
-static int
-nvfx_screen_get_video_param(struct pipe_screen *screen,
- enum pipe_video_profile profile,
- enum pipe_video_cap param)
-{
- switch (param) {
- case PIPE_VIDEO_CAP_SUPPORTED:
- return vl_profile_supported(screen, profile);
- case PIPE_VIDEO_CAP_NPOT_TEXTURES:
- return 0;
- case PIPE_VIDEO_CAP_MAX_WIDTH:
- case PIPE_VIDEO_CAP_MAX_HEIGHT:
- return vl_video_buffer_max_size(screen);
- case PIPE_VIDEO_CAP_PREFERED_FORMAT:
- return PIPE_FORMAT_NV12;
- case PIPE_VIDEO_CAP_PREFERS_INTERLACED:
- return false;
- case PIPE_VIDEO_CAP_SUPPORTS_INTERLACED:
- return false;
- case PIPE_VIDEO_CAP_SUPPORTS_PROGRESSIVE:
- return true;
- default:
- return 0;
- }
-}
-
-static boolean
-nvfx_screen_is_format_supported(struct pipe_screen *pscreen,
- enum pipe_format format,
- enum pipe_texture_target target,
- unsigned sample_count,
- unsigned bind)
-{
- struct nvfx_screen *screen = nvfx_screen(pscreen);
-
- if (!util_format_is_supported(format, bind))
- return FALSE;
-
- if (sample_count > 1)
- return FALSE;
-
- if (bind & PIPE_BIND_RENDER_TARGET) {
- switch (format) {
- case PIPE_FORMAT_B8G8R8A8_UNORM:
- case PIPE_FORMAT_B8G8R8X8_UNORM:
- case PIPE_FORMAT_R8G8B8A8_UNORM:
- case PIPE_FORMAT_R8G8B8X8_UNORM:
- case PIPE_FORMAT_B5G6R5_UNORM:
- break;
- case PIPE_FORMAT_R16G16B16A16_FLOAT:
- if(!screen->advertise_fp16)
- return FALSE;
- break;
- case PIPE_FORMAT_R32G32B32A32_FLOAT:
- if(!screen->advertise_fp32)
- return FALSE;
- break;
- default:
- return FALSE;
- }
- }
-
- if (bind & PIPE_BIND_DEPTH_STENCIL) {
- switch (format) {
- case PIPE_FORMAT_S8_UINT_Z24_UNORM:
- case PIPE_FORMAT_X8Z24_UNORM:
- case PIPE_FORMAT_Z16_UNORM:
- break;
- default:
- return FALSE;
- }
- }
-
- if (bind & PIPE_BIND_SAMPLER_VIEW) {
- struct nvfx_texture_format* tf = &nvfx_texture_formats[format];
- if(util_format_is_s3tc(format) && !util_format_s3tc_enabled)
- return FALSE;
- if(format == PIPE_FORMAT_R16G16B16A16_FLOAT && !screen->advertise_fp16)
- return FALSE;
- if(format == PIPE_FORMAT_R32G32B32A32_FLOAT && !screen->advertise_fp32)
- return FALSE;
- if(screen->use_nv4x)
- {
- if(tf->fmt[4] < 0)
- return FALSE;
- }
- else
- {
- if(tf->fmt[0] < 0)
- return FALSE;
- }
- }
-
- // note that we do actually support everything through translate
- if (bind & PIPE_BIND_VERTEX_BUFFER) {
- unsigned type = nvfx_vertex_formats[format];
- if(!type)
- return FALSE;
- }
-
- if (bind & PIPE_BIND_INDEX_BUFFER) {
- // 8-bit indices supported, but not in hardware index buffer
- if(format != PIPE_FORMAT_R16_USCALED && format != PIPE_FORMAT_R32_USCALED)
- return FALSE;
- }
-
- if(bind & PIPE_BIND_STREAM_OUTPUT)
- return FALSE;
-
- return TRUE;
-}
-
-static void
-nvfx_screen_destroy(struct pipe_screen *pscreen)
-{
- struct nvfx_screen *screen = nvfx_screen(pscreen);
-
- nouveau_resource_destroy(&screen->vp_exec_heap);
- nouveau_resource_destroy(&screen->vp_data_heap);
- nouveau_resource_destroy(&screen->query_heap);
- nouveau_notifier_free(&screen->query);
- nouveau_notifier_free(&screen->sync);
- nouveau_grobj_free(&screen->eng3d);
- nvfx_screen_surface_takedown(pscreen);
- nouveau_bo_ref(NULL, &screen->fence);
-
- nouveau_screen_fini(&screen->base);
-
- FREE(pscreen);
-}
-
-static void nv30_screen_init(struct nvfx_screen *screen)
-{
- struct nouveau_channel *chan = screen->base.channel;
- struct nouveau_grobj *eng3d = screen->eng3d;
- int i;
-
- /* TODO: perhaps we should do some of this on nv40 too? */
- for (i=1; i<8; i++) {
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_CLIP_HORIZ(i), 1);
- OUT_RING(chan, 0);
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_CLIP_VERT(i), 1);
- OUT_RING(chan, 0);
- }
-
- BEGIN_RING(chan, eng3d, 0x220, 1);
- OUT_RING(chan, 1);
-
- BEGIN_RING(chan, eng3d, 0x03b0, 1);
- OUT_RING(chan, 0x00100000);
- BEGIN_RING(chan, eng3d, 0x1454, 1);
- OUT_RING(chan, 0);
- BEGIN_RING(chan, eng3d, 0x1d80, 1);
- OUT_RING(chan, 3);
- BEGIN_RING(chan, eng3d, 0x1450, 1);
- OUT_RING(chan, 0x00030004);
-
- /* NEW */
- BEGIN_RING(chan, eng3d, 0x1e98, 1);
- OUT_RING(chan, 0);
- BEGIN_RING(chan, eng3d, 0x17e0, 3);
- OUT_RING(chan, fui(0.0));
- OUT_RING(chan, fui(0.0));
- OUT_RING(chan, fui(1.0));
- BEGIN_RING(chan, eng3d, 0x1f80, 16);
- for (i=0; i<16; i++) {
- OUT_RING(chan, (i==8) ? 0x0000ffff : 0);
- }
-
- BEGIN_RING(chan, eng3d, 0x120, 3);
- OUT_RING(chan, 0);
- OUT_RING(chan, 1);
- OUT_RING(chan, 2);
-
- BEGIN_RING(chan, eng3d, 0x1d88, 1);
- OUT_RING(chan, 0x00001200);
-
- BEGIN_RING(chan, eng3d, NV30_3D_RC_ENABLE, 1);
- OUT_RING(chan, 0);
-
- BEGIN_RING(chan, eng3d, NV30_3D_DEPTH_RANGE_NEAR, 2);
- OUT_RING(chan, fui(0.0));
- OUT_RING(chan, fui(1.0));
-
- BEGIN_RING(chan, eng3d, NV30_3D_MULTISAMPLE_CONTROL, 1);
- OUT_RING(chan, 0xffff0000);
-
- /* enables use of vp rather than fixed-function somehow */
- BEGIN_RING(chan, eng3d, 0x1e94, 1);
- OUT_RING(chan, 0x13);
-}
-
-static void nv40_screen_init(struct nvfx_screen *screen)
-{
- struct nouveau_channel *chan = screen->base.channel;
- struct nouveau_grobj *eng3d = screen->eng3d;
-
- BEGIN_RING(chan, eng3d, NV40_3D_DMA_COLOR2, 2);
- OUT_RING(chan, screen->base.channel->vram->handle);
- OUT_RING(chan, screen->base.channel->vram->handle);
-
- BEGIN_RING(chan, eng3d, 0x1450, 1);
- OUT_RING(chan, 0x00000004);
-
- BEGIN_RING(chan, eng3d, 0x1ea4, 3);
- OUT_RING(chan, 0x00000010);
- OUT_RING(chan, 0x01000100);
- OUT_RING(chan, 0xff800006);
-
- /* vtxprog output routing */
- BEGIN_RING(chan, eng3d, 0x1fc4, 1);
- OUT_RING(chan, 0x06144321);
- BEGIN_RING(chan, eng3d, 0x1fc8, 2);
- OUT_RING(chan, 0xedcba987);
- OUT_RING(chan, 0x0000006f);
- BEGIN_RING(chan, eng3d, 0x1fd0, 1);
- OUT_RING(chan, 0x00171615);
- BEGIN_RING(chan, eng3d, 0x1fd4, 1);
- OUT_RING(chan, 0x001b1a19);
-
- BEGIN_RING(chan, eng3d, 0x1ef8, 1);
- OUT_RING(chan, 0x0020ffff);
- BEGIN_RING(chan, eng3d, 0x1d64, 1);
- OUT_RING(chan, 0x01d300d4);
- BEGIN_RING(chan, eng3d, 0x1e94, 1);
- OUT_RING(chan, 0x00000001);
-
- BEGIN_RING(chan, eng3d, NV40_3D_MIPMAP_ROUNDING, 1);
- OUT_RING(chan, NV40_3D_MIPMAP_ROUNDING_MODE_DOWN);
-}
-
-static unsigned
-nvfx_screen_get_vertex_buffer_flags(struct nvfx_screen* screen)
-{
- int vram_hack_default = 0;
- int vram_hack;
- // TODO: this is a bit of a guess; also add other cards that may need this hack.
- // It may also depend on the specific card or the AGP/PCIe chipset.
- if(screen->base.device->chipset == 0x47 /* G70 */
- || screen->base.device->chipset == 0x49 /* G71 */
- || screen->base.device->chipset == 0x46 /* G72 */
- )
- vram_hack_default = 1;
- vram_hack = debug_get_bool_option("NOUVEAU_VTXIDX_IN_VRAM", vram_hack_default);
-
- return vram_hack ? NOUVEAU_BO_VRAM : NOUVEAU_BO_GART;
-}
-
-static void nvfx_channel_flush_notify(struct nouveau_channel* chan)
-{
- struct nvfx_screen* screen = chan->user_private;
- struct nvfx_context* nvfx = screen->cur_ctx;
- if(nvfx)
- nvfx->relocs_needed = NVFX_RELOCATE_ALL;
-}
-
-struct pipe_screen *
-nvfx_screen_create(struct nouveau_device *dev)
-{
- static const unsigned query_sizes[] = {(4096 - 4 * 32) / 32, 3 * 1024 / 32, 2 * 1024 / 32, 1024 / 32};
- struct nvfx_screen *screen = CALLOC_STRUCT(nvfx_screen);
- struct nouveau_channel *chan;
- struct pipe_screen *pscreen;
- unsigned eng3d_class = 0;
- int ret, i;
-
- if (!screen)
- return NULL;
-
- pscreen = &screen->base.base;
-
- ret = nouveau_screen_init(&screen->base, dev);
- if (ret) {
- nvfx_screen_destroy(pscreen);
- return NULL;
- }
- chan = screen->base.channel;
- screen->cur_ctx = NULL;
- chan->user_private = screen;
- chan->flush_notify = nvfx_channel_flush_notify;
-
- pscreen->destroy = nvfx_screen_destroy;
- pscreen->get_param = nvfx_screen_get_param;
- pscreen->get_shader_param = nvfx_screen_get_shader_param;
- pscreen->get_paramf = nvfx_screen_get_paramf;
- pscreen->get_video_param = nvfx_screen_get_video_param;
- pscreen->is_format_supported = nvfx_screen_is_format_supported;
- pscreen->is_video_format_supported = vl_video_buffer_is_format_supported;
- pscreen->context_create = nvfx_create;
-
- ret = nouveau_bo_new(dev, NOUVEAU_BO_VRAM, 0, 4096, &screen->fence);
- if (ret) {
- nvfx_screen_destroy(pscreen);
- return NULL;
- }
-
- switch (dev->chipset & 0xf0) {
- case 0x30:
- if (NV30_3D_CHIPSET_3X_MASK & (1 << (dev->chipset & 0x0f)))
- eng3d_class = NV30_3D;
- else if (NV34_3D_CHIPSET_3X_MASK & (1 << (dev->chipset & 0x0f)))
- eng3d_class = NV34_3D;
- else if (NV35_3D_CHIPSET_3X_MASK & (1 << (dev->chipset & 0x0f)))
- eng3d_class = NV35_3D;
- break;
- case 0x40:
- if (NV4X_GRCLASS4097_CHIPSETS & (1 << (dev->chipset & 0x0f)))
- eng3d_class = NV40_3D;
- else if (NV4X_GRCLASS4497_CHIPSETS & (1 << (dev->chipset & 0x0f)))
- eng3d_class = NV44_3D;
- screen->is_nv4x = ~0;
- break;
- case 0x60:
- if (NV6X_GRCLASS4497_CHIPSETS & (1 << (dev->chipset & 0x0f)))
- eng3d_class = NV44_3D;
- screen->is_nv4x = ~0;
- break;
- }
-
- if (!eng3d_class) {
- NOUVEAU_ERR("Unknown nv3x/nv4x chipset: nv%02x\n", dev->chipset);
- return NULL;
- }
-
- screen->advertise_npot = !!screen->is_nv4x;
- screen->advertise_blend_equation_separate = !!screen->is_nv4x;
- screen->use_nv4x = screen->is_nv4x;
-
- if(screen->is_nv4x) {
- if(debug_get_bool_option("NVFX_SIMULATE_NV30", FALSE))
- screen->use_nv4x = 0;
- if(!debug_get_bool_option("NVFX_NPOT", TRUE))
- screen->advertise_npot = 0;
- if(!debug_get_bool_option("NVFX_BLEND_EQ_SEP", TRUE))
- screen->advertise_blend_equation_separate = 0;
- }
-
- screen->force_swtnl = debug_get_bool_option("NVFX_SWTNL", FALSE);
- screen->trace_draw = debug_get_bool_option("NVFX_TRACE_DRAW", FALSE);
-
- screen->buffer_allocation_cost = debug_get_num_option("NVFX_BUFFER_ALLOCATION_COST", 16384);
- screen->inline_cost_per_hardware_cost = atof(debug_get_option("NVFX_INLINE_COST_PER_HARDWARE_COST", "1.0"));
- screen->static_reuse_threshold = atof(debug_get_option("NVFX_STATIC_REUSE_THRESHOLD", "2.0"));
-
- /* We don't advertise these by default because filtering and blending doesn't work as
- * it should, due to several restrictions.
- * The only exception is fp16 on nv40.
- */
- screen->advertise_fp16 = debug_get_bool_option("NVFX_FP16", !!screen->use_nv4x);
- screen->advertise_fp32 = debug_get_bool_option("NVFX_FP32", 0);
-
- screen->vertex_buffer_reloc_flags = nvfx_screen_get_vertex_buffer_flags(screen);
-
- /* surely both nv3x and nv44 support index buffers too: find out how and test that */
- if(eng3d_class == NV40_3D)
- screen->index_buffer_reloc_flags = screen->vertex_buffer_reloc_flags;
-
- if(!screen->force_swtnl && screen->vertex_buffer_reloc_flags == screen->index_buffer_reloc_flags)
- screen->base.vertex_buffer_flags = screen->base.index_buffer_flags = screen->vertex_buffer_reloc_flags;
-
- nvfx_screen_init_resource_functions(pscreen);
-
- ret = nouveau_grobj_alloc(chan, 0xbeef3097, eng3d_class, &screen->eng3d);
- if (ret) {
- NOUVEAU_ERR("Error creating 3D object: %d\n", ret);
- return FALSE;
- }
-
- /* 2D engine setup */
- nvfx_screen_surface_init(pscreen);
-
- /* Notifier for sync purposes */
- ret = nouveau_notifier_alloc(chan, 0xbeef0301, 1, &screen->sync);
- if (ret) {
- NOUVEAU_ERR("Error creating notifier object: %d\n", ret);
- nvfx_screen_destroy(pscreen);
- return NULL;
- }
-
- /* Query objects */
- for(i = 0; i < sizeof(query_sizes) / sizeof(query_sizes[0]); ++i)
- {
- ret = nouveau_notifier_alloc(chan, 0xbeef0302, query_sizes[i], &screen->query);
- if(!ret)
- break;
- }
-
- if (ret) {
- NOUVEAU_ERR("Error initialising query objects: %d\n", ret);
- nvfx_screen_destroy(pscreen);
- return NULL;
- }
-
- ret = nouveau_resource_init(&screen->query_heap, 0, query_sizes[i]);
- if (ret) {
- NOUVEAU_ERR("Error initialising query object heap: %d\n", ret);
- nvfx_screen_destroy(pscreen);
- return NULL;
- }
-
- LIST_INITHEAD(&screen->query_list);
-
- /* Vtxprog resources */
- if (nouveau_resource_init(&screen->vp_exec_heap, 0, screen->use_nv4x ? 512 : 256) ||
- nouveau_resource_init(&screen->vp_data_heap, 0, screen->use_nv4x ? 468 : 256)) {
- nvfx_screen_destroy(pscreen);
- return NULL;
- }
-
- BIND_RING(chan, screen->eng3d, 7);
-
- /* Static eng3d initialisation */
- /* note that we just started using the channel, so we must have space in the pushbuffer */
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_NOTIFY, 1);
- OUT_RING(chan, screen->sync->handle);
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_TEXTURE0, 2);
- OUT_RING(chan, chan->vram->handle);
- OUT_RING(chan, chan->gart->handle);
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_COLOR1, 1);
- OUT_RING(chan, chan->vram->handle);
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_COLOR0, 2);
- OUT_RING(chan, chan->vram->handle);
- OUT_RING(chan, chan->vram->handle);
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_VTXBUF0, 2);
- OUT_RING(chan, chan->vram->handle);
- OUT_RING(chan, chan->gart->handle);
-
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_FENCE, 2);
- OUT_RING(chan, 0);
- OUT_RING(chan, screen->query->handle);
-
- BEGIN_RING(chan, screen->eng3d, NV30_3D_DMA_UNK1AC, 2);
- OUT_RING(chan, chan->vram->handle);
- OUT_RING(chan, chan->vram->handle);
-
- if(!screen->is_nv4x)
- nv30_screen_init(screen);
- else
- nv40_screen_init(screen);
-
- return pscreen;
-}
+++ /dev/null
-#ifndef __NVFX_SCREEN_H__
-#define __NVFX_SCREEN_H__
-
-#include "pipe/p_compiler.h"
-#include "util/u_double_list.h"
-#include "nouveau/nouveau_screen.h"
-
-struct pipe_screen;
-
-struct nvfx_screen {
- struct nouveau_screen base;
-
- struct nouveau_bo *fence;
-
- struct nvfx_context *cur_ctx;
-
- unsigned is_nv4x; /* either 0 or ~0 */
- unsigned use_nv4x; /* either 0 or ~0 */
- boolean force_swtnl;
- boolean trace_draw;
- unsigned vertex_buffer_reloc_flags;
- unsigned index_buffer_reloc_flags;
- unsigned advertise_fp16;
- unsigned advertise_fp32;
- unsigned advertise_npot;
- unsigned advertise_blend_equation_separate;
-
- /* HW graphics objects */
- struct nouveau_grobj *eng3d;
- struct nouveau_notifier *sync;
-
- /* Query object resources */
- struct nouveau_notifier *query;
- struct nouveau_resource *query_heap;
- struct list_head query_list;
-
- /* Vtxprog resources */
- struct nouveau_resource *vp_exec_heap;
- struct nouveau_resource *vp_data_heap;
-
- struct nv04_2d_context* eng2d;
-
- /* Once the amount of bytes drawn from the buffer reaches the updated size times this value,
- * we will assume that the buffer will be drawn an huge number of times before the
- * next modification
- */
- float static_reuse_threshold;
-
- /* Cost of allocating a buffer in terms of the cost of copying a byte to an hardware buffer */
- unsigned buffer_allocation_cost;
-
- /* inline_cost/hardware_cost conversion ration */
- float inline_cost_per_hardware_cost;
-};
-
-static INLINE struct nvfx_screen *
-nvfx_screen(struct pipe_screen *screen)
-{
- return (struct nvfx_screen *)screen;
-}
-
-int nvfx_screen_surface_init(struct pipe_screen *pscreen);
-void nvfx_screen_surface_takedown(struct pipe_screen *pscreen);
-
-#endif
+++ /dev/null
-#ifndef __NVFX_SHADER_H__
-#define __NVFX_SHADER_H__
-
-#include <stdint.h>
-
-#include "pipe/p_compiler.h"
-
-#define NVFX_SWZ_IDENTITY ((3 << 6) | (2 << 4) | (1 << 2) | (0 << 0))
-
-/* this will resolve to either the NV30 or the NV40 version
- * depending on the current hardware */
-/* unusual, but very fast and compact method */
-#define NVFX_VP(c) ((NV30_VP_##c) + (nvfx->is_nv4x & ((NV40_VP_##c) - (NV30_VP_##c))))
-
-#define NVFX_VP_INST_SLOT_VEC 0
-#define NVFX_VP_INST_SLOT_SCA 1
-
-#define NVFX_VP_INST_IN_POS 0 /* These seem to match the bindings specified in */
-#define NVFX_VP_INST_IN_WEIGHT 1 /* the ARB_v_p spec (2.14.3.1) */
-#define NVFX_VP_INST_IN_NORMAL 2
-#define NVFX_VP_INST_IN_COL0 3 /* Should probably confirm them all though */
-#define NVFX_VP_INST_IN_COL1 4
-#define NVFX_VP_INST_IN_FOGC 5
-#define NVFX_VP_INST_IN_TC0 8
-#define NVFX_VP_INST_IN_TC(n) (8+n)
-
-#define NVFX_VP_INST_SCA_OP_NOP 0x00
-#define NVFX_VP_INST_SCA_OP_MOV 0x01
-#define NVFX_VP_INST_SCA_OP_RCP 0x02
-#define NVFX_VP_INST_SCA_OP_RCC 0x03
-#define NVFX_VP_INST_SCA_OP_RSQ 0x04
-#define NVFX_VP_INST_SCA_OP_EXP 0x05
-#define NVFX_VP_INST_SCA_OP_LOG 0x06
-#define NVFX_VP_INST_SCA_OP_LIT 0x07
-#define NVFX_VP_INST_SCA_OP_BRA 0x09
-#define NVFX_VP_INST_SCA_OP_CAL 0x0B
-#define NVFX_VP_INST_SCA_OP_RET 0x0C
-#define NVFX_VP_INST_SCA_OP_LG2 0x0D
-#define NVFX_VP_INST_SCA_OP_EX2 0x0E
-#define NVFX_VP_INST_SCA_OP_SIN 0x0F
-#define NVFX_VP_INST_SCA_OP_COS 0x10
-
-#define NV40_VP_INST_SCA_OP_PUSHA 0x13
-#define NV40_VP_INST_SCA_OP_POPA 0x14
-
-#define NVFX_VP_INST_VEC_OP_NOP 0x00
-#define NVFX_VP_INST_VEC_OP_MOV 0x01
-#define NVFX_VP_INST_VEC_OP_MUL 0x02
-#define NVFX_VP_INST_VEC_OP_ADD 0x03
-#define NVFX_VP_INST_VEC_OP_MAD 0x04
-#define NVFX_VP_INST_VEC_OP_DP3 0x05
-#define NVFX_VP_INST_VEC_OP_DPH 0x06
-#define NVFX_VP_INST_VEC_OP_DP4 0x07
-#define NVFX_VP_INST_VEC_OP_DST 0x08
-#define NVFX_VP_INST_VEC_OP_MIN 0x09
-#define NVFX_VP_INST_VEC_OP_MAX 0x0A
-#define NVFX_VP_INST_VEC_OP_SLT 0x0B
-#define NVFX_VP_INST_VEC_OP_SGE 0x0C
-#define NVFX_VP_INST_VEC_OP_ARL 0x0D
-#define NVFX_VP_INST_VEC_OP_FRC 0x0E
-#define NVFX_VP_INST_VEC_OP_FLR 0x0F
-#define NVFX_VP_INST_VEC_OP_SEQ 0x10
-#define NVFX_VP_INST_VEC_OP_SFL 0x11
-#define NVFX_VP_INST_VEC_OP_SGT 0x12
-#define NVFX_VP_INST_VEC_OP_SLE 0x13
-#define NVFX_VP_INST_VEC_OP_SNE 0x14
-#define NVFX_VP_INST_VEC_OP_STR 0x15
-#define NVFX_VP_INST_VEC_OP_SSG 0x16
-#define NVFX_VP_INST_VEC_OP_ARR 0x17
-#define NVFX_VP_INST_VEC_OP_ARA 0x18
-
-#define NV40_VP_INST_VEC_OP_TXL 0x19
-
-/* DWORD 3 */
-#define NVFX_VP_INST_LAST (1 << 0)
-
-/*
- * Each fragment program opcode appears to be comprised of 4 32-bit values.
- *
- * 0: OPDEST
- * 0: program end
- * 1-6: destination register
- * 7: destination register is fp16?? (use for outputs)
- * 8: set condition code
- * 9: writemask x
- * 10: writemask y
- * 11: writemask z
- * 12: writemask w
- * 13-16: source attribute register number (e.g. COL0)
- * 17-20: texture unit number
- * 21: expand value on texture operation (x -> 2x - 1)
- * 22-23: precision 0 = fp32, 1 = fp16, 2 = s1.10 fixed, 3 = s0.8 fixed (nv40-only))
- * 24-29: opcode
- * 30: no destination
- * 31: saturate
- * 1 - SRC0
- * 0-17: see common source fields
- * 18: execute if condition code less
- * 19: execute if condition code equal
- * 20: execute if condition code greater
- * 21-22: condition code swizzle x source component
- * 23-24: condition code swizzle y source component
- * 25-26: condition code swizzle z source component
- * 27-28: condition code swizzle w source component
- * 29: source 0 absolute
- * 30: always 0 in renouveau tests
- * 31: always 0 in renouveau tests
- * 2 - SRC1
- * 0-17: see common source fields
- * 18: source 1 absolute
- * 19-20: input precision 0 = fp32, 1 = fp16, 2 = s1.10 fixed, 3 = ???
- * 21-27: always 0 in renouveau tests
- * 28-30: scale (0 = 1x, 1 = 2x, 2 = 4x, 3 = 8x, 4 = ???, 5, = 1/2, 6 = 1/4, 7 = 1/8)
- * 31: opcode is branch
- * 3 - SRC2
- * 0-17: see common source fields
- * 18: source 2 absolute
- * 19-29: address register displacement
- * 30: use index register
- * 31: disable perspective-correct interpolation?
- *
-* Common fields of 0, 1, 2 - SRC
- * 0-1: source register type (0 = temp, 1 = input, 2 = immediate, 3 = ???)
- * 2-7: source temp register index
- * 8: source register is fp16??
- * 9-10: source swizzle x source component
- * 11-12: source swizzle y source component
- * 13-14: source swizzle z source component
- * 15-16: source swizzle w source component
- * 17: negate
-
- * There appears to be no special difference between result regs and temp regs.
- * result.color == R0.xyzw
- * result.depth == R1.z
- * When the fragprog contains instructions to write depth, NV30_TCL_PRIMITIVE_3D_UNK1D78=0
- * otherwise it is set to 1.
- *
- * Constants are inserted directly after the instruction that uses them.
- *
- * It appears that it's not possible to use two input registers in one
- * instruction as the input sourcing is done in the instruction dword
- * and not the source selection dwords. As such instructions such as:
- *
- * ADD result.color, fragment.color, fragment.texcoord[0];
- *
- * must be split into two MOV's and then an ADD (nvidia does this) but
- * I'm not sure why it's not just one MOV and then source the second input
- * in the ADD instruction..
- *
- * Negation of the full source is done with NV30_FP_REG_NEGATE, arbitrary
- * negation requires multiplication with a const.
- *
- * Arbitrary swizzling is supported with the exception of SWIZZLE_ZERO/SWIZZLE_ONE
- * The temp/result regs appear to be initialised to (0.0, 0.0, 0.0, 0.0) as SWIZZLE_ZERO
- * is implemented simply by not writing to the relevant components of the destination.
- *
- * Conditional execution
- * TODO
- *
- * Non-native instructions:
- * LIT
- * LRP - MAD+MAD
- * SUB - ADD, negate second source
- * RSQ - LG2 + EX2
- * POW - LG2 + MUL + EX2
- * SCS - COS + SIN
- * XPD
- *
- * NV40 Looping
- * Loops appear to be fairly expensive on NV40 at least, the proprietary
- * driver goes to a lot of effort to avoid using the native looping
- * instructions. If the total number of *executed* instructions between
- * REP/ENDREP or LOOP/ENDLOOP is <=500, the driver will unroll the loop.
- * The maximum loop count is 255.
- *
- */
-
-//== Opcode / Destination selection ==
-#define NVFX_FP_OP_PROGRAM_END (1 << 0)
-#define NVFX_FP_OP_OUT_REG_SHIFT 1
-#define NV30_FP_OP_OUT_REG_MASK (31 << 1) /* uncertain */
-#define NV40_FP_OP_OUT_REG_MASK (63 << 1)
-/* Needs to be set when writing outputs to get expected result.. */
-#define NVFX_FP_OP_OUT_REG_HALF (1 << 7)
-#define NVFX_FP_OP_COND_WRITE_ENABLE (1 << 8)
-#define NVFX_FP_OP_OUTMASK_SHIFT 9
-#define NVFX_FP_OP_OUTMASK_MASK (0xF << 9)
-# define NVFX_FP_OP_OUT_X (1<<9)
-# define NVFX_FP_OP_OUT_Y (1<<10)
-# define NVFX_FP_OP_OUT_Z (1<<11)
-# define NVFX_FP_OP_OUT_W (1<<12)
-/* Uncertain about these, especially the input_src values.. it's possible that
- * they can be dynamically changed.
- */
-#define NVFX_FP_OP_INPUT_SRC_SHIFT 13
-#define NVFX_FP_OP_INPUT_SRC_MASK (15 << 13)
-# define NVFX_FP_OP_INPUT_SRC_POSITION 0x0
-# define NVFX_FP_OP_INPUT_SRC_COL0 0x1
-# define NVFX_FP_OP_INPUT_SRC_COL1 0x2
-# define NVFX_FP_OP_INPUT_SRC_FOGC 0x3
-# define NVFX_FP_OP_INPUT_SRC_TC0 0x4
-# define NVFX_FP_OP_INPUT_SRC_TC(n) (0x4 + n)
-# define NV40_FP_OP_INPUT_SRC_FACING 0xE
-#define NVFX_FP_OP_TEX_UNIT_SHIFT 17
-#define NVFX_FP_OP_TEX_UNIT_MASK (0xF << 17) /* guess */
-#define NVFX_FP_OP_PRECISION_SHIFT 22
-#define NVFX_FP_OP_PRECISION_MASK (3 << 22)
-# define NVFX_FP_PRECISION_FP32 0
-# define NVFX_FP_PRECISION_FP16 1
-# define NVFX_FP_PRECISION_FX12 2
-#define NVFX_FP_OP_OPCODE_SHIFT 24
-#define NVFX_FP_OP_OPCODE_MASK (0x3F << 24)
-/* NV30/NV40 fragment program opcodes */
-#define NVFX_FP_OP_OPCODE_NOP 0x00
-#define NVFX_FP_OP_OPCODE_MOV 0x01
-#define NVFX_FP_OP_OPCODE_MUL 0x02
-#define NVFX_FP_OP_OPCODE_ADD 0x03
-#define NVFX_FP_OP_OPCODE_MAD 0x04
-#define NVFX_FP_OP_OPCODE_DP3 0x05
-#define NVFX_FP_OP_OPCODE_DP4 0x06
-#define NVFX_FP_OP_OPCODE_DST 0x07
-#define NVFX_FP_OP_OPCODE_MIN 0x08
-#define NVFX_FP_OP_OPCODE_MAX 0x09
-#define NVFX_FP_OP_OPCODE_SLT 0x0A
-#define NVFX_FP_OP_OPCODE_SGE 0x0B
-#define NVFX_FP_OP_OPCODE_SLE 0x0C
-#define NVFX_FP_OP_OPCODE_SGT 0x0D
-#define NVFX_FP_OP_OPCODE_SNE 0x0E
-#define NVFX_FP_OP_OPCODE_SEQ 0x0F
-#define NVFX_FP_OP_OPCODE_FRC 0x10
-#define NVFX_FP_OP_OPCODE_FLR 0x11
-#define NVFX_FP_OP_OPCODE_KIL 0x12
-#define NVFX_FP_OP_OPCODE_PK4B 0x13
-#define NVFX_FP_OP_OPCODE_UP4B 0x14
-#define NVFX_FP_OP_OPCODE_DDX 0x15 /* can only write XY */
-#define NVFX_FP_OP_OPCODE_DDY 0x16 /* can only write XY */
-#define NVFX_FP_OP_OPCODE_TEX 0x17
-#define NVFX_FP_OP_OPCODE_TXP 0x18
-#define NVFX_FP_OP_OPCODE_TXD 0x19
-#define NVFX_FP_OP_OPCODE_RCP 0x1A
-#define NVFX_FP_OP_OPCODE_EX2 0x1C
-#define NVFX_FP_OP_OPCODE_LG2 0x1D
-#define NVFX_FP_OP_OPCODE_STR 0x20
-#define NVFX_FP_OP_OPCODE_SFL 0x21
-#define NVFX_FP_OP_OPCODE_COS 0x22
-#define NVFX_FP_OP_OPCODE_SIN 0x23
-#define NVFX_FP_OP_OPCODE_PK2H 0x24
-#define NVFX_FP_OP_OPCODE_UP2H 0x25
-#define NVFX_FP_OP_OPCODE_PK4UB 0x27
-#define NVFX_FP_OP_OPCODE_UP4UB 0x28
-#define NVFX_FP_OP_OPCODE_PK2US 0x29
-#define NVFX_FP_OP_OPCODE_UP2US 0x2A
-#define NVFX_FP_OP_OPCODE_DP2A 0x2E
-#define NVFX_FP_OP_OPCODE_TXB 0x31
-#define NVFX_FP_OP_OPCODE_DIV 0x3A
-
-/* NV30 only fragment program opcodes */
-#define NVFX_FP_OP_OPCODE_RSQ_NV30 0x1B
-#define NVFX_FP_OP_OPCODE_LIT_NV30 0x1E
-#define NVFX_FP_OP_OPCODE_LRP_NV30 0x1F
-#define NVFX_FP_OP_OPCODE_POW_NV30 0x26
-#define NVFX_FP_OP_OPCODE_RFL_NV30 0x36
-
-/* NV40 only fragment program opcodes */
-#define NVFX_FP_OP_OPCODE_TXL_NV40 0x2F
-#define NVFX_FP_OP_OPCODE_LITEX2_NV40 0x3C
-
-/* The use of these instructions appears to be indicated by bit 31 of DWORD 2.*/
-#define NV40_FP_OP_BRA_OPCODE_BRK 0x0
-#define NV40_FP_OP_BRA_OPCODE_CAL 0x1
-#define NV40_FP_OP_BRA_OPCODE_IF 0x2
-#define NV40_FP_OP_BRA_OPCODE_LOOP 0x3
-#define NV40_FP_OP_BRA_OPCODE_REP 0x4
-#define NV40_FP_OP_BRA_OPCODE_RET 0x5
-
-#define NV40_FP_OP_OUT_NONE (1 << 30)
-#define NVFX_FP_OP_OUT_SAT (1 << 31)
-
-/* high order bits of SRC0 */
-#define NVFX_FP_OP_SRC0_ABS (1 << 29)
-#define NVFX_FP_OP_COND_SWZ_W_SHIFT 27
-#define NVFX_FP_OP_COND_SWZ_W_MASK (3 << 27)
-#define NVFX_FP_OP_COND_SWZ_Z_SHIFT 25
-#define NVFX_FP_OP_COND_SWZ_Z_MASK (3 << 25)
-#define NVFX_FP_OP_COND_SWZ_Y_SHIFT 23
-#define NVFX_FP_OP_COND_SWZ_Y_MASK (3 << 23)
-#define NVFX_FP_OP_COND_SWZ_X_SHIFT 21
-#define NVFX_FP_OP_COND_SWZ_X_MASK (3 << 21)
-#define NVFX_FP_OP_COND_SWZ_ALL_SHIFT 21
-#define NVFX_FP_OP_COND_SWZ_ALL_MASK (0xFF << 21)
-#define NVFX_FP_OP_COND_SHIFT 18
-#define NVFX_FP_OP_COND_MASK (0x07 << 18)
-# define NVFX_FP_OP_COND_FL 0
-# define NVFX_FP_OP_COND_LT 1
-# define NVFX_FP_OP_COND_EQ 2
-# define NVFX_FP_OP_COND_LE 3
-# define NVFX_FP_OP_COND_GT 4
-# define NVFX_FP_OP_COND_NE 5
-# define NVFX_FP_OP_COND_GE 6
-# define NVFX_FP_OP_COND_TR 7
-
-/* high order bits of SRC1 */
-#define NV40_FP_OP_OPCODE_IS_BRANCH (1<<31)
-#define NVFX_FP_OP_DST_SCALE_SHIFT 28
-#define NVFX_FP_OP_DST_SCALE_MASK (3 << 28)
-#define NVFX_FP_OP_DST_SCALE_1X 0
-#define NVFX_FP_OP_DST_SCALE_2X 1
-#define NVFX_FP_OP_DST_SCALE_4X 2
-#define NVFX_FP_OP_DST_SCALE_8X 3
-#define NVFX_FP_OP_DST_SCALE_INV_2X 5
-#define NVFX_FP_OP_DST_SCALE_INV_4X 6
-#define NVFX_FP_OP_DST_SCALE_INV_8X 7
-#define NVFX_FP_OP_SRC1_ABS (1 << 18)
-
-/* SRC1 LOOP */
-#define NV40_FP_OP_LOOP_INCR_SHIFT 19
-#define NV40_FP_OP_LOOP_INCR_MASK (0xFF << 19)
-#define NV40_FP_OP_LOOP_INDEX_SHIFT 10
-#define NV40_FP_OP_LOOP_INDEX_MASK (0xFF << 10)
-#define NV40_FP_OP_LOOP_COUNT_SHIFT 2
-#define NV40_FP_OP_LOOP_COUNT_MASK (0xFF << 2)
-
-/* SRC1 IF: absolute offset in dwords */
-#define NV40_FP_OP_ELSE_OFFSET_SHIFT 0
-#define NV40_FP_OP_ELSE_OFFSET_MASK (0x7FFFFFFF << 0)
-
-/* SRC1 CAL */
-#define NV40_FP_OP_SUB_OFFSET_SHIFT 0
-#define NV40_FP_OP_SUB_OFFSET_MASK (0x7FFFFFFF << 0)
-
-/* SRC1 REP
- * I have no idea why there are 3 count values here.. but they
- * have always been filled with the same value in my tests so
- * far..
- */
-#define NV40_FP_OP_REP_COUNT1_SHIFT 2
-#define NV40_FP_OP_REP_COUNT1_MASK (0xFF << 2)
-#define NV40_FP_OP_REP_COUNT2_SHIFT 10
-#define NV40_FP_OP_REP_COUNT2_MASK (0xFF << 10)
-#define NV40_FP_OP_REP_COUNT3_SHIFT 19
-#define NV40_FP_OP_REP_COUNT3_MASK (0xFF << 19)
-
-/* SRC2 REP/IF: absolute offset in dwords */
-#define NV40_FP_OP_END_OFFSET_SHIFT 0
-#define NV40_FP_OP_END_OFFSET_MASK (0x7FFFFFFF << 0)
-
-/* high order bits of SRC2 */
-#define NVFX_FP_OP_INDEX_INPUT (1 << 30)
-#define NV40_FP_OP_ADDR_INDEX_SHIFT 19
-#define NV40_FP_OP_ADDR_INDEX_MASK (0xF << 19)
-
-//== Register selection ==
-#define NVFX_FP_REG_TYPE_SHIFT 0
-#define NVFX_FP_REG_TYPE_MASK (3 << 0)
-# define NVFX_FP_REG_TYPE_TEMP 0
-# define NVFX_FP_REG_TYPE_INPUT 1
-# define NVFX_FP_REG_TYPE_CONST 2
-#define NVFX_FP_REG_SRC_SHIFT 2
-#define NV30_FP_REG_SRC_MASK (31 << 2)
-#define NV40_FP_REG_SRC_MASK (63 << 2)
-#define NVFX_FP_REG_SRC_HALF (1 << 8)
-#define NVFX_FP_REG_SWZ_ALL_SHIFT 9
-#define NVFX_FP_REG_SWZ_ALL_MASK (255 << 9)
-#define NVFX_FP_REG_SWZ_X_SHIFT 9
-#define NVFX_FP_REG_SWZ_X_MASK (3 << 9)
-#define NVFX_FP_REG_SWZ_Y_SHIFT 11
-#define NVFX_FP_REG_SWZ_Y_MASK (3 << 11)
-#define NVFX_FP_REG_SWZ_Z_SHIFT 13
-#define NVFX_FP_REG_SWZ_Z_MASK (3 << 13)
-#define NVFX_FP_REG_SWZ_W_SHIFT 15
-#define NVFX_FP_REG_SWZ_W_MASK (3 << 15)
-# define NVFX_FP_SWIZZLE_X 0
-# define NVFX_FP_SWIZZLE_Y 1
-# define NVFX_FP_SWIZZLE_Z 2
-# define NVFX_FP_SWIZZLE_W 3
-#define NVFX_FP_REG_NEGATE (1 << 17)
-
-#define NVFXSR_NONE 0
-#define NVFXSR_OUTPUT 1
-#define NVFXSR_INPUT 2
-#define NVFXSR_TEMP 3
-#define NVFXSR_CONST 5
-#define NVFXSR_IMM 6
-#define NVFXSR_RELOCATED 7
-
-#define NVFX_COND_FL 0
-#define NVFX_COND_LT 1
-#define NVFX_COND_EQ 2
-#define NVFX_COND_LE 3
-#define NVFX_COND_GT 4
-#define NVFX_COND_NE 5
-#define NVFX_COND_GE 6
-#define NVFX_COND_TR 7
-
-/* Yes, this are ordered differently... */
-
-#define NVFX_VP_MASK_X 8
-#define NVFX_VP_MASK_Y 4
-#define NVFX_VP_MASK_Z 2
-#define NVFX_VP_MASK_W 1
-#define NVFX_VP_MASK_ALL 0xf
-
-#define NVFX_FP_MASK_X 1
-#define NVFX_FP_MASK_Y 2
-#define NVFX_FP_MASK_Z 4
-#define NVFX_FP_MASK_W 8
-#define NVFX_FP_MASK_ALL 0xf
-
-#define NVFX_SWZ_X 0
-#define NVFX_SWZ_Y 1
-#define NVFX_SWZ_Z 2
-#define NVFX_SWZ_W 3
-
-#define swz(s,x,y,z,w) nvfx_src_swz((s), NVFX_SWZ_##x, NVFX_SWZ_##y, NVFX_SWZ_##z, NVFX_SWZ_##w)
-#define neg(s) nvfx_src_neg((s))
-#define abs(s) nvfx_src_abs((s))
-
-struct nvfx_reg {
- int8_t type;
- uint32_t index;
-};
-
-struct nvfx_src {
- struct nvfx_reg reg;
-
- uint8_t indirect : 1;
- uint8_t indirect_reg : 1;
- uint8_t indirect_swz : 2;
- uint8_t negate : 1;
- uint8_t abs : 1;
- uint8_t swz[4];
-};
-
-struct nvfx_insn
-{
- uint8_t op;
- char scale;
- int8_t unit;
- uint8_t mask;
- uint8_t cc_swz[4];
-
- uint8_t sat : 1;
- uint8_t cc_update : 1;
- uint8_t cc_update_reg : 1;
- uint8_t cc_test : 3;
- uint8_t cc_test_reg : 1;
-
- struct nvfx_reg dst;
- struct nvfx_src src[3];
-};
-
-static INLINE struct nvfx_insn
-nvfx_insn(boolean sat, unsigned op, int unit, struct nvfx_reg dst, unsigned mask, struct nvfx_src s0, struct nvfx_src s1, struct nvfx_src s2)
-{
- struct nvfx_insn insn = {
- .op = op,
- .scale = 0,
- .unit = unit,
- .sat = sat,
- .mask = mask,
- .cc_update = 0,
- .cc_update_reg = 0,
- .cc_test = NVFX_COND_TR,
- .cc_test_reg = 0,
- .cc_swz = { 0, 1, 2, 3 },
- .dst = dst,
- .src = {s0, s1, s2}
- };
- return insn;
-}
-
-static INLINE struct nvfx_reg
-nvfx_reg(int type, int index)
-{
- struct nvfx_reg temp = {
- .type = type,
- .index = index,
- };
- return temp;
-}
-
-static INLINE struct nvfx_src
-nvfx_src(struct nvfx_reg reg)
-{
- struct nvfx_src temp = {
- .reg = reg,
- .abs = 0,
- .negate = 0,
- .swz = { 0, 1, 2, 3 },
- .indirect = 0,
- };
- return temp;
-}
-
-static INLINE struct nvfx_src
-nvfx_src_swz(struct nvfx_src src, int x, int y, int z, int w)
-{
- struct nvfx_src dst = src;
-
- dst.swz[NVFX_SWZ_X] = src.swz[x];
- dst.swz[NVFX_SWZ_Y] = src.swz[y];
- dst.swz[NVFX_SWZ_Z] = src.swz[z];
- dst.swz[NVFX_SWZ_W] = src.swz[w];
- return dst;
-}
-
-static INLINE struct nvfx_src
-nvfx_src_neg(struct nvfx_src src)
-{
- src.negate = !src.negate;
- return src;
-}
-
-static INLINE struct nvfx_src
-nvfx_src_abs(struct nvfx_src src)
-{
- src.abs = 1;
- return src;
-}
-
-struct nvfx_relocation {
- unsigned location;
- unsigned target;
-};
-
-#endif
+++ /dev/null
-#include "pipe/p_state.h"
-#include "pipe/p_defines.h"
-#include "util/u_inlines.h"
-#include "util/u_framebuffer.h"
-
-#include "draw/draw_context.h"
-
-#include "tgsi/tgsi_parse.h"
-
-#include "nvfx_context.h"
-#include "nvfx_state.h"
-#include "nvfx_tex.h"
-
-static void *
-nvfx_blend_state_create(struct pipe_context *pipe,
- const struct pipe_blend_state *cso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_blend_state *bso = CALLOC(1, sizeof(*bso));
- struct nouveau_statebuf_builder sb = sb_init(bso->sb);
-
- if (cso->rt[0].blend_enable) {
- sb_method(sb, NV30_3D_BLEND_FUNC_ENABLE, 3);
- sb_data(sb, 1);
- sb_data(sb, (nvgl_blend_func(cso->rt[0].alpha_src_factor) << 16) |
- nvgl_blend_func(cso->rt[0].rgb_src_factor));
- sb_data(sb, nvgl_blend_func(cso->rt[0].alpha_dst_factor) << 16 |
- nvgl_blend_func(cso->rt[0].rgb_dst_factor));
- if(nvfx->screen->base.device->chipset < 0x40) {
- sb_method(sb, NV30_3D_BLEND_EQUATION, 1);
- sb_data(sb, nvgl_blend_eqn(cso->rt[0].rgb_func));
- } else {
- sb_method(sb, NV40_3D_BLEND_EQUATION, 1);
- sb_data(sb, nvgl_blend_eqn(cso->rt[0].alpha_func) << 16 |
- nvgl_blend_eqn(cso->rt[0].rgb_func));
- }
- } else {
- sb_method(sb, NV30_3D_BLEND_FUNC_ENABLE, 1);
- sb_data(sb, 0);
- }
-
- sb_method(sb, NV30_3D_COLOR_MASK, 1);
- sb_data(sb, (((cso->rt[0].colormask & PIPE_MASK_A) ? (0x01 << 24) : 0) |
- ((cso->rt[0].colormask & PIPE_MASK_R) ? (0x01 << 16) : 0) |
- ((cso->rt[0].colormask & PIPE_MASK_G) ? (0x01 << 8) : 0) |
- ((cso->rt[0].colormask & PIPE_MASK_B) ? (0x01 << 0) : 0)));
-
- /* TODO: add NV40 MRT color mask */
-
- if (cso->logicop_enable) {
- sb_method(sb, NV30_3D_COLOR_LOGIC_OP_ENABLE, 2);
- sb_data(sb, 1);
- sb_data(sb, nvgl_logicop_func(cso->logicop_func));
- } else {
- sb_method(sb, NV30_3D_COLOR_LOGIC_OP_ENABLE, 1);
- sb_data(sb, 0);
- }
-
- sb_method(sb, NV30_3D_DITHER_ENABLE, 1);
- sb_data(sb, cso->dither ? 1 : 0);
-
- bso->sb_len = sb_len(sb, bso->sb);
- bso->pipe = *cso;
- return (void *)bso;
-}
-
-static void
-nvfx_blend_state_bind(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->blend = hwcso;
- nvfx->dirty |= NVFX_NEW_BLEND;
-}
-
-static void
-nvfx_blend_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_blend_state *bso = hwcso;
-
- FREE(bso);
-}
-
-static void *
-nvfx_rasterizer_state_create(struct pipe_context *pipe,
- const struct pipe_rasterizer_state *cso)
-{
- struct nvfx_rasterizer_state *rsso = CALLOC(1, sizeof(*rsso));
- struct nouveau_statebuf_builder sb = sb_init(rsso->sb);
-
- /*XXX: ignored:
- * point_smooth -nohw
- * multisample
- * sprite_coord_origin
- */
-
- sb_method(sb, NV30_3D_SHADE_MODEL, 1);
- sb_data(sb, cso->flatshade ? NV30_3D_SHADE_MODEL_FLAT :
- NV30_3D_SHADE_MODEL_SMOOTH);
-
- sb_method(sb, NV30_3D_VERTEX_TWO_SIDE_ENABLE, 1);
- sb_data(sb, cso->light_twoside);
-
- sb_method(sb, NV30_3D_LINE_WIDTH, 2);
- sb_data(sb, (unsigned char)(cso->line_width * 8.0) & 0xff);
- sb_data(sb, cso->line_smooth ? 1 : 0);
- sb_method(sb, NV30_3D_LINE_STIPPLE_ENABLE, 2);
- sb_data(sb, cso->line_stipple_enable ? 1 : 0);
- sb_data(sb, (cso->line_stipple_pattern << 16) |
- cso->line_stipple_factor);
-
- sb_method(sb, NV30_3D_POINT_SIZE, 1);
- sb_data(sb, fui(cso->point_size));
-
- sb_method(sb, NV30_3D_POLYGON_MODE_FRONT, 6);
- sb_data(sb, nvgl_polygon_mode(cso->fill_front));
- sb_data(sb, nvgl_polygon_mode(cso->fill_back));
- switch (cso->cull_face) {
- case PIPE_FACE_FRONT:
- sb_data(sb, NV30_3D_CULL_FACE_FRONT);
- break;
- case PIPE_FACE_BACK:
- sb_data(sb, NV30_3D_CULL_FACE_BACK);
- break;
- case PIPE_FACE_FRONT_AND_BACK:
- sb_data(sb, NV30_3D_CULL_FACE_FRONT_AND_BACK);
- break;
- default:
- sb_data(sb, NV30_3D_CULL_FACE_BACK);
- break;
- }
- if (cso->front_ccw) {
- sb_data(sb, NV30_3D_FRONT_FACE_CCW);
- } else {
- sb_data(sb, NV30_3D_FRONT_FACE_CW);
- }
- sb_data(sb, cso->poly_smooth ? 1 : 0);
- sb_data(sb, (cso->cull_face != PIPE_FACE_NONE) ? 1 : 0);
-
- sb_method(sb, NV30_3D_POLYGON_STIPPLE_ENABLE, 1);
- sb_data(sb, cso->poly_stipple_enable ? 1 : 0);
-
- sb_method(sb, NV30_3D_POLYGON_OFFSET_POINT_ENABLE, 3);
- sb_data(sb, cso->offset_point);
- sb_data(sb, cso->offset_line);
- sb_data(sb, cso->offset_tri);
-
- if (cso->offset_point || cso->offset_line || cso->offset_tri) {
- sb_method(sb, NV30_3D_POLYGON_OFFSET_FACTOR, 2);
- sb_data(sb, fui(cso->offset_scale));
- sb_data(sb, fui(cso->offset_units * 2));
- }
-
- sb_method(sb, NV30_3D_FLATSHADE_FIRST, 1);
- sb_data(sb, cso->flatshade_first);
-
- rsso->pipe = *cso;
- rsso->sb_len = sb_len(sb, rsso->sb);
- return (void *)rsso;
-}
-
-static void
-nvfx_rasterizer_state_bind(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- if(nvfx->rasterizer && hwcso)
- {
- if(!nvfx->rasterizer || ((struct nvfx_rasterizer_state*)hwcso)->pipe.scissor
- != nvfx->rasterizer->pipe.scissor)
- {
- nvfx->dirty |= NVFX_NEW_SCISSOR;
- nvfx->draw_dirty |= NVFX_NEW_SCISSOR;
- }
-
- if(((struct nvfx_rasterizer_state*)hwcso)->pipe.point_quad_rasterization != nvfx->rasterizer->pipe.point_quad_rasterization
- || ((struct nvfx_rasterizer_state*)hwcso)->pipe.sprite_coord_enable != nvfx->rasterizer->pipe.sprite_coord_enable
- || ((struct nvfx_rasterizer_state*)hwcso)->pipe.sprite_coord_mode != nvfx->rasterizer->pipe.sprite_coord_mode)
- {
- nvfx->dirty |= NVFX_NEW_SPRITE;
- }
- }
-
- nvfx->rasterizer = hwcso;
- nvfx->dirty |= NVFX_NEW_RAST;
- nvfx->draw_dirty |= NVFX_NEW_RAST;
-}
-
-static void
-nvfx_rasterizer_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_rasterizer_state *rsso = hwcso;
-
- FREE(rsso);
-}
-
-static void *
-nvfx_depth_stencil_alpha_state_create(struct pipe_context *pipe,
- const struct pipe_depth_stencil_alpha_state *cso)
-{
- struct nvfx_zsa_state *zsaso = CALLOC(1, sizeof(*zsaso));
- struct nouveau_statebuf_builder sb = sb_init(zsaso->sb);
-
- sb_method(sb, NV30_3D_DEPTH_FUNC, 1);
- sb_data (sb, nvgl_comparison_op(cso->depth.func));
-
- sb_method(sb, NV30_3D_ALPHA_FUNC_ENABLE, 3);
- sb_data (sb, cso->alpha.enabled ? 1 : 0);
- sb_data (sb, nvgl_comparison_op(cso->alpha.func));
- sb_data (sb, float_to_ubyte(cso->alpha.ref_value));
-
- if (cso->stencil[0].enabled) {
- sb_method(sb, NV30_3D_STENCIL_ENABLE(0), 3);
- sb_data (sb, cso->stencil[0].enabled ? 1 : 0);
- sb_data (sb, cso->stencil[0].writemask);
- sb_data (sb, nvgl_comparison_op(cso->stencil[0].func));
- sb_method(sb, NV30_3D_STENCIL_FUNC_MASK(0), 4);
- sb_data (sb, cso->stencil[0].valuemask);
- sb_data (sb, nvgl_stencil_op(cso->stencil[0].fail_op));
- sb_data (sb, nvgl_stencil_op(cso->stencil[0].zfail_op));
- sb_data (sb, nvgl_stencil_op(cso->stencil[0].zpass_op));
- } else {
- sb_method(sb, NV30_3D_STENCIL_ENABLE(0), 1);
- sb_data (sb, 0);
- }
-
- if (cso->stencil[1].enabled) {
- sb_method(sb, NV30_3D_STENCIL_ENABLE(1), 3);
- sb_data (sb, cso->stencil[1].enabled ? 1 : 0);
- sb_data (sb, cso->stencil[1].writemask);
- sb_data (sb, nvgl_comparison_op(cso->stencil[1].func));
- sb_method(sb, NV30_3D_STENCIL_FUNC_MASK(1), 4);
- sb_data (sb, cso->stencil[1].valuemask);
- sb_data (sb, nvgl_stencil_op(cso->stencil[1].fail_op));
- sb_data (sb, nvgl_stencil_op(cso->stencil[1].zfail_op));
- sb_data (sb, nvgl_stencil_op(cso->stencil[1].zpass_op));
- } else {
- sb_method(sb, NV30_3D_STENCIL_ENABLE(1), 1);
- sb_data (sb, 0);
- }
-
- zsaso->pipe = *cso;
- zsaso->sb_len = sb_len(sb, zsaso->sb);
- return (void *)zsaso;
-}
-
-static void
-nvfx_depth_stencil_alpha_state_bind(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->zsa = hwcso;
- nvfx->dirty |= NVFX_NEW_ZSA;
-}
-
-static void
-nvfx_depth_stencil_alpha_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_zsa_state *zsaso = hwcso;
-
- FREE(zsaso);
-}
-
-static void
-nvfx_set_blend_color(struct pipe_context *pipe,
- const struct pipe_blend_color *bcol)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->blend_colour = *bcol;
- nvfx->dirty |= NVFX_NEW_BCOL;
-}
-
-static void
-nvfx_set_stencil_ref(struct pipe_context *pipe,
- const struct pipe_stencil_ref *sr)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->stencil_ref = *sr;
- nvfx->dirty |= NVFX_NEW_SR;
-}
-
-static void
-nvfx_set_clip_state(struct pipe_context *pipe,
- const struct pipe_clip_state *clip)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->clip = *clip;
- nvfx->dirty |= NVFX_NEW_UCP;
- nvfx->draw_dirty |= NVFX_NEW_UCP;
-}
-
-static void
-nvfx_set_sample_mask(struct pipe_context *pipe,
- unsigned sample_mask)
-{
-}
-
-static void
-nvfx_set_constant_buffer(struct pipe_context *pipe, uint shader, uint index,
- struct pipe_resource *buf )
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- pipe_resource_reference(&nvfx->constbuf[shader], buf);
- nvfx->constbuf_nr[shader] = buf ? (buf->width0 / (4 * sizeof(float))) : 0;
-
- if (shader == PIPE_SHADER_VERTEX) {
- nvfx->dirty |= NVFX_NEW_VERTCONST;
- } else
- if (shader == PIPE_SHADER_FRAGMENT) {
- nvfx->dirty |= NVFX_NEW_FRAGCONST;
- }
-}
-
-static void
-nvfx_set_framebuffer_state(struct pipe_context *pipe,
- const struct pipe_framebuffer_state *fb)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- if(fb)
- util_copy_framebuffer_state(&nvfx->framebuffer, fb);
- else
- util_unreference_framebuffer_state(&nvfx->framebuffer);
- nvfx->dirty |= NVFX_NEW_FB;
-}
-
-static void
-nvfx_set_polygon_stipple(struct pipe_context *pipe,
- const struct pipe_poly_stipple *stipple)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- memcpy(nvfx->stipple, stipple->stipple, 4 * 32);
- nvfx->dirty |= NVFX_NEW_STIPPLE;
-}
-
-static void
-nvfx_set_scissor_state(struct pipe_context *pipe,
- const struct pipe_scissor_state *s)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->scissor = *s;
- nvfx->dirty |= NVFX_NEW_SCISSOR;
-}
-
-static void
-nvfx_set_viewport_state(struct pipe_context *pipe,
- const struct pipe_viewport_state *vpt)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->viewport = *vpt;
- nvfx->dirty |= NVFX_NEW_VIEWPORT;
- nvfx->draw_dirty |= NVFX_NEW_VIEWPORT;
-}
-
-void
-nvfx_init_state_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.create_blend_state = nvfx_blend_state_create;
- nvfx->pipe.bind_blend_state = nvfx_blend_state_bind;
- nvfx->pipe.delete_blend_state = nvfx_blend_state_delete;
-
- nvfx->pipe.create_rasterizer_state = nvfx_rasterizer_state_create;
- nvfx->pipe.bind_rasterizer_state = nvfx_rasterizer_state_bind;
- nvfx->pipe.delete_rasterizer_state = nvfx_rasterizer_state_delete;
-
- nvfx->pipe.create_depth_stencil_alpha_state =
- nvfx_depth_stencil_alpha_state_create;
- nvfx->pipe.bind_depth_stencil_alpha_state =
- nvfx_depth_stencil_alpha_state_bind;
- nvfx->pipe.delete_depth_stencil_alpha_state =
- nvfx_depth_stencil_alpha_state_delete;
-
- nvfx->pipe.set_blend_color = nvfx_set_blend_color;
- nvfx->pipe.set_stencil_ref = nvfx_set_stencil_ref;
- nvfx->pipe.set_clip_state = nvfx_set_clip_state;
- nvfx->pipe.set_sample_mask = nvfx_set_sample_mask;
- nvfx->pipe.set_constant_buffer = nvfx_set_constant_buffer;
- nvfx->pipe.set_framebuffer_state = nvfx_set_framebuffer_state;
- nvfx->pipe.set_polygon_stipple = nvfx_set_polygon_stipple;
- nvfx->pipe.set_scissor_state = nvfx_set_scissor_state;
- nvfx->pipe.set_viewport_state = nvfx_set_viewport_state;
-}
+++ /dev/null
-#ifndef __NVFX_STATE_H__
-#define __NVFX_STATE_H__
-
-#include "pipe/p_state.h"
-#include "pipe/p_video_state.h"
-#include "tgsi/tgsi_scan.h"
-#include "nouveau/nouveau_statebuf.h"
-#include "util/u_dynarray.h"
-#include "util/u_linkage.h"
-
-struct nvfx_vertex_program_exec {
- uint32_t data[4];
-};
-
-struct nvfx_vertex_program_data {
- int index; /* immediates == -1 */
- float value[4];
-};
-
-struct nvfx_vertex_program {
- unsigned long long id;
-
- struct nvfx_vertex_program_exec *insns;
- unsigned nr_insns;
- struct nvfx_vertex_program_data *consts;
- unsigned nr_consts;
-
- char generic_to_fp_input[256];
- int sprite_fp_input;
-
- struct nouveau_resource *exec;
- unsigned exec_start;
- struct nouveau_resource *data;
- unsigned data_start;
- unsigned data_start_min;
-
- uint32_t ir;
- uint32_t or;
- int clip_nr;
-
- struct util_dynarray branch_relocs;
- struct util_dynarray const_relocs;
-};
-
-#define NVFX_VP_FAILED ((struct nvfx_vertex_program*)-1)
-
-struct nvfx_pipe_vertex_program {
- struct pipe_shader_state pipe;
- struct tgsi_shader_info info;
-
- unsigned draw_elements;
- boolean draw_no_elements;
- struct draw_vertex_shader *draw_vs;
- struct nvfx_vertex_program* draw_vp;
-
- struct nvfx_vertex_program* vp;
-};
-
-struct nvfx_fragment_program_data {
- unsigned offset;
- unsigned index;
-};
-
-struct nvfx_fragment_program_bo {
- struct nvfx_fragment_program_bo* next;
- struct nouveau_bo* bo;
- unsigned char* slots;
- char insn[] __attribute__((aligned(16)));
-};
-
-struct nvfx_fragment_program {
- unsigned samplers;
- unsigned point_sprite_control;
- unsigned or;
- unsigned coord_conventions;
-
- uint32_t *insn;
- int insn_len;
-
- struct nvfx_fragment_program_data *consts;
- unsigned nr_consts;
-
- /* the slot at num_slots is for the sprite coordinate, if any */
- unsigned num_slots; /* how many input semantics? */
- unsigned char slot_to_generic[10]; /* semantics */
- unsigned char slot_to_fp_input[11]; /* current assignment of slots for each used semantic */
- struct util_dynarray slot_relocations[11];
-
- /* This is reset to progs on any relocation update, and decreases every time we
- * move to a new prog due to a constant update
- * When this is the same as progs, applying relocations is no longer necessary.
- */
- unsigned progs_left_with_obsolete_slot_assignments;
-
- unsigned long long last_vp_id;
- unsigned last_sprite_coord_enable;
-
- uint32_t fp_control;
-
- unsigned bo_prog_idx;
- unsigned prog_size;
- unsigned progs_per_bo;
- unsigned progs;
-
- struct nvfx_fragment_program_bo* fpbo;
-};
-
-struct nvfx_pipe_fragment_program {
- struct pipe_shader_state pipe;
- struct tgsi_shader_info info;
-
- struct nvfx_fragment_program* fps[2];
-};
-
-#endif
+++ /dev/null
-#include "nvfx_context.h"
-#include "nvfx_state.h"
-#include "nvfx_resource.h"
-#include "draw/draw_context.h"
-
-void
-nvfx_state_viewport_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct pipe_viewport_state *vpt = &nvfx->viewport;
-
- if(nvfx->render_mode == HW) {
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_TRANSLATE_X, 8);
- OUT_RINGf(chan, vpt->translate[0]);
- OUT_RINGf(chan, vpt->translate[1]);
- OUT_RINGf(chan, vpt->translate[2]);
- OUT_RINGf(chan, vpt->translate[3]);
- OUT_RINGf(chan, vpt->scale[0]);
- OUT_RINGf(chan, vpt->scale[1]);
- OUT_RINGf(chan, vpt->scale[2]);
- OUT_RINGf(chan, vpt->scale[3]);
- BEGIN_RING(chan, eng3d, 0x1d78, 1);
- OUT_RING(chan, 1);
- } else {
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_TRANSLATE_X, 8);
- OUT_RINGf(chan, 0.0f);
- OUT_RINGf(chan, 0.0f);
- OUT_RINGf(chan, 0.0f);
- OUT_RINGf(chan, 0.0f);
- OUT_RINGf(chan, 1.0f);
- OUT_RINGf(chan, 1.0f);
- OUT_RINGf(chan, 1.0f);
- OUT_RINGf(chan, 1.0f);
- BEGIN_RING(chan, eng3d, 0x1d78, 1);
- OUT_RING(chan, nvfx->is_nv4x ? 0x110 : 1);
- }
-}
-
-void
-nvfx_state_scissor_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct pipe_rasterizer_state *rast = &nvfx->rasterizer->pipe;
- struct pipe_scissor_state *s = &nvfx->scissor;
-
- if ((rast->scissor == 0 && nvfx->state.scissor_enabled == 0))
- return;
- nvfx->state.scissor_enabled = rast->scissor;
-
- BEGIN_RING(chan, eng3d, NV30_3D_SCISSOR_HORIZ, 2);
- if (nvfx->state.scissor_enabled) {
- OUT_RING(chan, ((s->maxx - s->minx) << 16) | s->minx);
- OUT_RING(chan, ((s->maxy - s->miny) << 16) | s->miny);
- } else {
- OUT_RING(chan, 4096 << 16);
- OUT_RING(chan, 4096 << 16);
- }
-}
-
-void
-nvfx_state_sr_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct pipe_stencil_ref *sr = &nvfx->stencil_ref;
-
- BEGIN_RING(chan, eng3d, NV30_3D_STENCIL_FUNC_REF(0), 1);
- OUT_RING(chan, sr->ref_value[0]);
- BEGIN_RING(chan, eng3d, NV30_3D_STENCIL_FUNC_REF(1), 1);
- OUT_RING(chan, sr->ref_value[1]);
-}
-
-void
-nvfx_state_blend_colour_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- struct pipe_blend_color *bcol = &nvfx->blend_colour;
-
- BEGIN_RING(chan, eng3d, NV30_3D_BLEND_COLOR, 1);
- OUT_RING(chan, ((float_to_ubyte(bcol->color[3]) << 24) |
- (float_to_ubyte(bcol->color[0]) << 16) |
- (float_to_ubyte(bcol->color[1]) << 8) |
- (float_to_ubyte(bcol->color[2]) << 0)));
-}
-
-void
-nvfx_state_stipple_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
-
- BEGIN_RING(chan, eng3d, NV30_3D_POLYGON_STIPPLE_PATTERN(0), 32);
- OUT_RINGp(chan, nvfx->stipple, 32);
-}
-
-static void
-nvfx_coord_conventions_validate(struct nvfx_context* nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned value = nvfx->hw_fragprog->coord_conventions;
- if(value & NV30_3D_COORD_CONVENTIONS_ORIGIN_INVERTED)
- value |= nvfx->framebuffer.height << NV30_3D_COORD_CONVENTIONS_HEIGHT__SHIFT;
-
- BEGIN_RING(chan, eng3d, NV30_3D_COORD_CONVENTIONS, 1);
- OUT_RING(chan, value);
-}
-
-static void
-nvfx_ucp_validate(struct nvfx_context* nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned enables[] =
- {
- NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE0,
- NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE1,
- NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE2,
- NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE3,
- NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE4,
- NV30_3D_VP_CLIP_PLANES_ENABLE_PLANE5
- };
- unsigned i, enable = 0, nr = 0;
-
- for (i = 0; i < 6; i++) {
- if (nvfx->rasterizer->pipe.clip_plane_enable & (1 << i)) {
- enable |= enables[i];
- nr = i+1;
- }
- }
-
- if(!nvfx->use_vp_clipping)
- {
- BEGIN_RING(chan, eng3d, NV30_3D_VP_CLIP_PLANES_ENABLE, 1);
- OUT_RING(chan, 0);
-
- BEGIN_RING(chan, eng3d, NV30_3D_VP_CLIP_PLANE(0, 0),
- nr * 4);
- OUT_RINGp(chan, &nvfx->clip.ucp[0][0], nr * 4);
- }
-
- BEGIN_RING(chan, eng3d, NV30_3D_VP_CLIP_PLANES_ENABLE, 1);
- OUT_RING(chan, enable);
-}
-
-static void
-nvfx_vertprog_ucp_validate(struct nvfx_context* nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned i;
- struct nvfx_vertex_program* vp = nvfx->hw_vertprog;
- unsigned enable = nvfx->rasterizer->pipe.clip_plane_enable;
- unsigned nr = util_bitcount(enable);
-
- if(nr != vp->clip_nr)
- {
- unsigned idx;
-
- /* remove last instruction bit */
- if(vp->clip_nr >= 0)
- {
- idx = vp->nr_insns - 7 + vp->clip_nr;
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_FROM_ID, 1);
- OUT_RING(chan, vp->exec->start + idx);
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_INST(0), 4);
- OUT_RINGp (chan, vp->insns[idx].data, 4);
- }
-
- /* set last instruction bit */
- idx = vp->nr_insns - 7 + nr;
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_FROM_ID, 1);
- OUT_RING(chan, vp->exec->start + idx);
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_INST(0), 4);
- OUT_RINGp(chan, vp->insns[idx].data, 3);
- OUT_RING(chan, vp->insns[idx].data[3] | 1);
- vp->clip_nr = nr;
- }
-
- // TODO: only do this for the ones changed
- for(i = 0; enable; ++i)
- {
- unsigned index = ffs(enable) - 1;
- enable &= ~(1 << index);
-
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_CONST_ID, 5);
- OUT_RING(chan, vp->data->start + i);
- OUT_RINGp (chan, nvfx->clip.ucp[index], 4);
- }
-}
-
-static boolean
-nvfx_state_validate_common(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned dirty;
- unsigned still_dirty = 0;
- boolean flush_tex_cache = FALSE;
-
- if(nvfx != nvfx->screen->cur_ctx)
- {
- nvfx->dirty = ~0;
- nvfx->hw_vtxelt_nr = 16;
- nvfx->hw_pointsprite_control = -1;
- nvfx->hw_vp_output = -1;
- nvfx->screen->cur_ctx = nvfx;
- nvfx->relocs_needed = NVFX_RELOCATE_ALL;
- }
-
- dirty = nvfx->dirty;
-
- if(nvfx->render_mode == HW)
- {
- if(dirty & (NVFX_NEW_VERTPROG | NVFX_NEW_VERTCONST))
- {
- if(!nvfx_vertprog_validate(nvfx))
- return FALSE;
- }
-
- if(dirty & NVFX_NEW_ARRAYS)
- {
- if(!nvfx_vbo_validate(nvfx))
- return FALSE;
- }
-
- if(dirty & NVFX_NEW_INDEX)
- {
- if(nvfx->use_index_buffer)
- nvfx_idxbuf_validate(nvfx);
- else
- still_dirty = NVFX_NEW_INDEX;
- }
- }
- else
- {
- if(dirty & NVFX_NEW_VERTPROG) {
- assert(nvfx_vertprog_validate(nvfx));
- nvfx_vbo_swtnl_validate(nvfx);
- }
- }
-
- if(dirty & NVFX_NEW_SAMPLER) {
- /* XXX: we take the big hammer here, I have no idea why this is needed
- to make this work properly */
- nvfx->dirty &= ~NVFX_NEW_SAMPLER;
- nvfx_fragtex_validate(nvfx);
-
- // TODO: only set this if really necessary
- flush_tex_cache = TRUE;
- }
-
- if(dirty & NVFX_NEW_RAST)
- sb_emit(chan, nvfx->rasterizer->sb, nvfx->rasterizer->sb_len);
-
- if(dirty & NVFX_NEW_SCISSOR)
- nvfx_state_scissor_validate(nvfx);
-
- if(dirty & NVFX_NEW_STIPPLE)
- nvfx_state_stipple_validate(nvfx);
-
- if(nvfx->dirty & (NVFX_NEW_UCP | NVFX_NEW_RAST))
- nvfx_ucp_validate(nvfx);
-
- if(nvfx->use_vp_clipping && (nvfx->dirty &
- (NVFX_NEW_UCP | NVFX_NEW_VERTPROG |
- NVFX_NEW_RAST)))
- nvfx_vertprog_ucp_validate(nvfx);
-
- if(dirty & (NVFX_NEW_FRAGPROG | NVFX_NEW_FRAGCONST |
- NVFX_NEW_VERTPROG | NVFX_NEW_SPRITE))
- {
- nvfx_fragprog_validate(nvfx);
- if(dirty & NVFX_NEW_FRAGPROG)
- flush_tex_cache = TRUE; // TODO: do we need this?
- }
-
- if(nvfx->is_nv4x)
- {
- unsigned vp_output = nvfx->hw_vertprog->or | nvfx->hw_fragprog->or;
- vp_output |= ((1 << (nvfx->rasterizer->pipe.clip_plane_enable & 63)) - 1) << 6;
-
- if(vp_output != nvfx->hw_vp_output)
- {
- BEGIN_RING(chan, eng3d, NV40_3D_VP_RESULT_EN, 1);
- OUT_RING(chan, vp_output);
- nvfx->hw_vp_output = vp_output;
- }
- }
-
- if(dirty & NVFX_NEW_FB)
- nvfx_framebuffer_validate(nvfx);
-
- if(dirty & NVFX_NEW_BLEND)
- sb_emit(chan, nvfx->blend->sb, nvfx->blend->sb_len);
-
- if(dirty & NVFX_NEW_BCOL)
- nvfx_state_blend_colour_validate(nvfx);
-
- if(dirty & NVFX_NEW_ZSA)
- sb_emit(chan, nvfx->zsa->sb, nvfx->zsa->sb_len);
-
- if(dirty & NVFX_NEW_SR)
- nvfx_state_sr_validate(nvfx);
-
- /* XXX: nv3x needs viewport revalidation after RAST or ZSA change */
- if(dirty & (NVFX_NEW_VIEWPORT | NVFX_NEW_RAST | NVFX_NEW_ZSA))
- {
- nvfx_state_viewport_validate(nvfx);
- }
-
- if(dirty & (NVFX_NEW_ZSA | NVFX_NEW_FB))
- {
- BEGIN_RING(chan, eng3d, NV30_3D_DEPTH_WRITE_ENABLE, 2);
- OUT_RING(chan, nvfx->framebuffer.zsbuf &&
- nvfx->zsa->pipe.depth.writemask);
- OUT_RING(chan, nvfx->framebuffer.zsbuf &&
- nvfx->zsa->pipe.depth.enabled);
- }
-
- if(dirty & (NVFX_NEW_FRAGPROG | NVFX_NEW_FB))
- nvfx_coord_conventions_validate(nvfx);
-
- if(flush_tex_cache && nvfx->is_nv4x)
- {
- BEGIN_RING(chan, eng3d, NV40_3D_TEX_CACHE_CTL, 1);
- OUT_RING(chan, 2);
- BEGIN_RING(chan, eng3d, NV40_3D_TEX_CACHE_CTL, 1);
- OUT_RING(chan, 1);
- }
-
- nvfx->dirty = dirty & still_dirty;
-
- return TRUE;
-}
-
-inline void
-nvfx_state_relocate(struct nvfx_context *nvfx, unsigned relocs)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- /* we need to ensure there is enough space to output relocations in one go */
- const unsigned max_relocs = 0
- + 16 /* vertex buffers, incl. dma flag */
- + 2 /* index buffer plus format+dma flag */
- + 2 * 5 /* 4 cbufs + zsbuf, plus dma objects */
- + 2 * 16 /* fragment textures plus format+dma flag */
- + 2 * 4 /* vertex textures plus format+dma flag */
- + 1 /* fragprog incl dma flag */
- ;
-
- MARK_RING(chan, max_relocs * 2, max_relocs * 2);
-
- if(relocs & NVFX_RELOCATE_FRAMEBUFFER)
- nvfx_framebuffer_relocate(nvfx);
- if(relocs & NVFX_RELOCATE_FRAGTEX)
- nvfx_fragtex_relocate(nvfx);
- if(relocs & NVFX_RELOCATE_FRAGPROG)
- nvfx_fragprog_relocate(nvfx);
- if(relocs & NVFX_RELOCATE_VTXBUF)
- nvfx_vbo_relocate(nvfx);
- if(relocs & NVFX_RELOCATE_IDXBUF)
- nvfx_idxbuf_relocate(nvfx);
-}
-
-boolean
-nvfx_state_validate(struct nvfx_context *nvfx)
-{
- if (nvfx->render_mode != HW) {
- /* Don't even bother trying to go back to hw if none
- * of the states that caused swtnl previously have changed.
- */
- if ((nvfx->fallback_swtnl & nvfx->dirty)
- != nvfx->fallback_swtnl)
- return FALSE;
-
- /* Attempt to go to hwtnl again */
- nvfx->dirty |= (NVFX_NEW_VIEWPORT |
- NVFX_NEW_VERTPROG |
- NVFX_NEW_ARRAYS);
- nvfx->render_mode = HW;
- }
-
- if(!nvfx_state_validate_common(nvfx))
- return FALSE;
-
- return TRUE;
-}
-
-boolean
-nvfx_state_validate_swtnl(struct nvfx_context *nvfx)
-{
- struct draw_context *draw = nvfx->draw;
-
- /* Setup for swtnl */
- if (nvfx->render_mode == HW) {
- static boolean warned = FALSE;
- if(!warned) {
- NOUVEAU_ERR("hw->swtnl 0x%08x\n", nvfx->fallback_swtnl);
- warned = TRUE;
- }
- nvfx->pipe.flush(&nvfx->pipe, NULL);
- nvfx->dirty |= (NVFX_NEW_VIEWPORT |
- NVFX_NEW_VERTPROG |
- NVFX_NEW_ARRAYS);
- nvfx->render_mode = SWTNL;
- }
-
- if (nvfx->draw_dirty & NVFX_NEW_VERTPROG) {
- if(!nvfx->vertprog->draw_vs)
- nvfx->vertprog->draw_vs = draw_create_vertex_shader(draw, &nvfx->vertprog->pipe);
- draw_bind_vertex_shader(draw, nvfx->vertprog->draw_vs);
- }
-
- if (nvfx->draw_dirty & NVFX_NEW_RAST)
- draw_set_rasterizer_state(draw, &nvfx->rasterizer->pipe,
- nvfx->rasterizer);
-
- if (nvfx->draw_dirty & NVFX_NEW_UCP)
- draw_set_clip_state(draw, &nvfx->clip);
-
- if (nvfx->draw_dirty & NVFX_NEW_VIEWPORT)
- draw_set_viewport_state(draw, &nvfx->viewport);
-
- if (nvfx->draw_dirty & NVFX_NEW_ARRAYS) {
- draw_set_vertex_buffers(draw, nvfx->vtxbuf_nr, nvfx->vtxbuf);
- draw_set_vertex_elements(draw, nvfx->vtxelt->num_elements, nvfx->vtxelt->pipe);
- }
-
- if (nvfx->draw_dirty & NVFX_NEW_INDEX)
- draw_set_index_buffer(draw, &nvfx->idxbuf);
-
- nvfx_state_validate_common(nvfx);
-
- nvfx->draw_dirty = 0;
- return TRUE;
-}
+++ /dev/null
-#include "nvfx_context.h"
-#include "nvfx_resource.h"
-#include "util/u_format.h"
-
-static inline boolean
-nvfx_surface_linear_target(struct pipe_surface* surf)
-{
- return !!((struct nvfx_miptree*)surf->texture)->linear_pitch;
-}
-
-static void
-nvfx_surface_get_render_target(struct pipe_surface* surf,
- struct nvfx_render_target* target)
-{
- struct nvfx_surface* ns = (struct nvfx_surface*)surf;
-
- target->bo = ((struct nvfx_miptree*)surf->texture)->base.bo;
- target->offset = ns->offset;
- target->pitch = align(ns->pitch, 64);
- assert(target->pitch);
-}
-
-void
-nvfx_framebuffer_validate(struct nvfx_context *nvfx)
-{
- struct pipe_framebuffer_state *fb = &nvfx->framebuffer;
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- uint32_t rt_enable, rt_format;
- int i;
- unsigned rt_flags = NOUVEAU_BO_RDWR | NOUVEAU_BO_VRAM;
- unsigned w = fb->width;
- unsigned h = fb->height;
- int all_swizzled =1 , cb_format = 0;
-
- /* do some sanity checks on the render target state and check if the targets
- * are swizzled
- */
- nvfx->is_nv4x ? assert(fb->nr_cbufs <= 4) : assert(fb->nr_cbufs <= 1);
- if(fb->nr_cbufs && fb->zsbuf)
- assert(util_format_get_blocksize(fb->cbufs[0]->format) ==
- util_format_get_blocksize(fb->zsbuf->format));
-
- for(i = 0; i < fb->nr_cbufs; i++) {
- if(cb_format)
- assert(cb_format == fb->cbufs[i]->format);
- else
- cb_format = fb->cbufs[i]->format;
-
- if(nvfx_surface_linear_target(fb->cbufs[i]))
- all_swizzled = 0;
- }
-
- if(fb->zsbuf && nvfx_surface_linear_target(fb->zsbuf))
- all_swizzled = 0;
-
- rt_enable = (NV30_3D_RT_ENABLE_COLOR0 << fb->nr_cbufs) - 1;
- if(rt_enable & (NV30_3D_RT_ENABLE_COLOR1 |
- NV40_3D_RT_ENABLE_COLOR2 | NV40_3D_RT_ENABLE_COLOR3))
- rt_enable |= NV30_3D_RT_ENABLE_MRT;
-
- for(i = 0; i < fb->nr_cbufs; i++)
- nvfx_surface_get_render_target(fb->cbufs[i], &nvfx->hw_rt[i]);
-
- for(; i < 4; ++i)
- nvfx->hw_rt[i].bo = NULL;
-
- nvfx->hw_zeta.bo = NULL;
-
- if(fb->zsbuf) {
- nvfx_surface_get_render_target(fb->zsbuf, &nvfx->hw_zeta);
- assert(util_format_get_stride(fb->zsbuf->format, fb->width) <=
- nvfx->hw_zeta.pitch);
- }
-
- if(all_swizzled) {
- /* hardware rounds down render target offset to 64 bytes,
- * but surfaces with a size of 2x2 pixel (16bpp) or 1x1 pixel (32bpp)
- * have an unaligned start address, for those two important square
- * formats we can hack around this limitation by adjusting the viewport
- */
- if(nvfx->hw_rt[0].offset & 63) {
- int delta = nvfx->hw_rt[0].offset & 63;
- h = 2;
- w = 16;
- nvfx->viewport.translate[0] += delta /
- (util_format_get_blocksize(fb->cbufs[0]->format) * 2);
- nvfx->dirty |= NVFX_NEW_VIEWPORT;
- }
-
- rt_format = NV30_3D_RT_FORMAT_TYPE_SWIZZLED |
- (util_logbase2(w) << NV30_3D_RT_FORMAT_LOG2_WIDTH__SHIFT) |
- (util_logbase2(h) << NV30_3D_RT_FORMAT_LOG2_HEIGHT__SHIFT);
- } else {
- rt_format = NV30_3D_RT_FORMAT_TYPE_LINEAR;
- }
-
- if(fb->nr_cbufs > 0) {
- switch (fb->cbufs[0]->format) {
- case PIPE_FORMAT_B8G8R8X8_UNORM:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_X8R8G8B8;
- break;
- case PIPE_FORMAT_B8G8R8A8_UNORM:
- case 0:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_A8R8G8B8;
- break;
- case PIPE_FORMAT_R8G8B8X8_UNORM:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_X8B8G8R8;
- break;
- case PIPE_FORMAT_R8G8B8A8_UNORM:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_A8B8G8R8;
- break;
- case PIPE_FORMAT_B5G6R5_UNORM:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_R5G6B5;
- break;
- case PIPE_FORMAT_R32G32B32A32_FLOAT:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_A32B32G32R32_FLOAT;
- break;
- case PIPE_FORMAT_R16G16B16A16_FLOAT:
- rt_format |= NV30_3D_RT_FORMAT_COLOR_A16B16G16R16_FLOAT;
- break;
- default:
- assert(0);
- }
- } else if(fb->zsbuf && util_format_get_blocksize(fb->zsbuf->format) == 2)
- rt_format |= NV30_3D_RT_FORMAT_COLOR_R5G6B5;
- else
- rt_format |= NV30_3D_RT_FORMAT_COLOR_A8R8G8B8;
-
- if(fb->zsbuf) {
- switch (fb->zsbuf->format) {
- case PIPE_FORMAT_Z16_UNORM:
- rt_format |= NV30_3D_RT_FORMAT_ZETA_Z16;
- break;
- case PIPE_FORMAT_S8_UINT_Z24_UNORM:
- case PIPE_FORMAT_X8Z24_UNORM:
- case 0:
- rt_format |= NV30_3D_RT_FORMAT_ZETA_Z24S8;
- break;
- default:
- assert(0);
- }
- } else if(fb->nr_cbufs && util_format_get_blocksize(fb->cbufs[0]->format) == 2)
- rt_format |= NV30_3D_RT_FORMAT_ZETA_Z16;
- else
- rt_format |= NV30_3D_RT_FORMAT_ZETA_Z24S8;
-
- MARK_RING(chan, 42, 10);
-
- if ((rt_enable & NV30_3D_RT_ENABLE_COLOR0) || fb->zsbuf) {
- struct nvfx_render_target *rt0 = &nvfx->hw_rt[0];
- uint32_t pitch;
-
- if(!(rt_enable & NV30_3D_RT_ENABLE_COLOR0))
- rt0 = &nvfx->hw_zeta;
-
- pitch = rt0->pitch;
-
- if(!nvfx->is_nv4x)
- {
- if (nvfx->hw_zeta.bo)
- pitch |= (nvfx->hw_zeta.pitch << 16);
- else
- pitch |= (pitch << 16);
- }
-
- //printf("rendering to bo %p [%i] at offset %i with pitch %i\n", rt0->bo, rt0->bo->handle, rt0->offset, pitch);
-
- BEGIN_RING(chan, eng3d, NV30_3D_DMA_COLOR0, 1);
- OUT_RELOC(chan, rt0->bo, 0,
- rt_flags | NOUVEAU_BO_OR,
- chan->vram->handle, chan->gart->handle);
- BEGIN_RING(chan, eng3d, NV30_3D_COLOR0_PITCH, 2);
- OUT_RING(chan, pitch);
- OUT_RELOC(chan, rt0->bo,
- rt0->offset, rt_flags | NOUVEAU_BO_LOW,
- 0, 0);
- }
-
- if (rt_enable & NV30_3D_RT_ENABLE_COLOR1) {
- BEGIN_RING(chan, eng3d, NV30_3D_DMA_COLOR1, 1);
- OUT_RELOC(chan, nvfx->hw_rt[1].bo, 0,
- rt_flags | NOUVEAU_BO_OR,
- chan->vram->handle, chan->gart->handle);
- BEGIN_RING(chan, eng3d, NV30_3D_COLOR1_OFFSET, 2);
- OUT_RELOC(chan, nvfx->hw_rt[1].bo,
- nvfx->hw_rt[1].offset, rt_flags | NOUVEAU_BO_LOW,
- 0, 0);
- OUT_RING(chan, nvfx->hw_rt[1].pitch);
- }
-
- if(nvfx->is_nv4x)
- {
- if (rt_enable & NV40_3D_RT_ENABLE_COLOR2) {
- BEGIN_RING(chan, eng3d, NV40_3D_DMA_COLOR2, 1);
- OUT_RELOC(chan, nvfx->hw_rt[2].bo, 0,
- rt_flags | NOUVEAU_BO_OR,
- chan->vram->handle, chan->gart->handle);
- BEGIN_RING(chan, eng3d, NV40_3D_COLOR2_OFFSET, 1);
- OUT_RELOC(chan, nvfx->hw_rt[2].bo,
- nvfx->hw_rt[2].offset, rt_flags | NOUVEAU_BO_LOW,
- 0, 0);
- BEGIN_RING(chan, eng3d, NV40_3D_COLOR2_PITCH, 1);
- OUT_RING(chan, nvfx->hw_rt[2].pitch);
- }
-
- if (rt_enable & NV40_3D_RT_ENABLE_COLOR3) {
- BEGIN_RING(chan, eng3d, NV40_3D_DMA_COLOR3, 1);
- OUT_RELOC(chan, nvfx->hw_rt[3].bo, 0,
- rt_flags | NOUVEAU_BO_OR,
- chan->vram->handle, chan->gart->handle);
- BEGIN_RING(chan, eng3d, NV40_3D_COLOR3_OFFSET, 1);
- OUT_RELOC(chan, nvfx->hw_rt[3].bo,
- nvfx->hw_rt[3].offset, rt_flags | NOUVEAU_BO_LOW,
- 0, 0);
- BEGIN_RING(chan, eng3d, NV40_3D_COLOR3_PITCH, 1);
- OUT_RING(chan, nvfx->hw_rt[3].pitch);
- }
- }
-
- if (fb->zsbuf) {
- BEGIN_RING(chan, eng3d, NV30_3D_DMA_ZETA, 1);
- OUT_RELOC(chan, nvfx->hw_zeta.bo, 0,
- rt_flags | NOUVEAU_BO_OR,
- chan->vram->handle, chan->gart->handle);
- BEGIN_RING(chan, eng3d, NV30_3D_ZETA_OFFSET, 1);
- /* TODO: reverse engineer LMA */
- OUT_RELOC(chan, nvfx->hw_zeta.bo,
- nvfx->hw_zeta.offset, rt_flags | NOUVEAU_BO_LOW, 0, 0);
- if(nvfx->is_nv4x) {
- BEGIN_RING(chan, eng3d, NV40_3D_ZETA_PITCH, 1);
- OUT_RING(chan, nvfx->hw_zeta.pitch);
- }
- }
- else if(nvfx->is_nv4x) {
- BEGIN_RING(chan, eng3d, NV40_3D_ZETA_PITCH, 1);
- OUT_RING(chan, 64);
- }
-
- BEGIN_RING(chan, eng3d, NV30_3D_RT_ENABLE, 1);
- OUT_RING(chan, rt_enable);
- BEGIN_RING(chan, eng3d, NV30_3D_RT_HORIZ, 3);
- OUT_RING(chan, (w << 16) | 0);
- OUT_RING(chan, (h << 16) | 0);
- OUT_RING(chan, rt_format);
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_HORIZ, 2);
- OUT_RING(chan, (w << 16) | 0);
- OUT_RING(chan, (h << 16) | 0);
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_CLIP_HORIZ(0), 2);
- OUT_RING(chan, ((w - 1) << 16) | 0);
- OUT_RING(chan, ((h - 1) << 16) | 0);
-
- if(!nvfx->is_nv4x) {
- /* Wonder why this is needed, context should all be set to zero on init */
- /* TODO: we can most likely remove this, after putting it in context init */
- BEGIN_RING(chan, eng3d, NV30_3D_VIEWPORT_TX_ORIGIN, 1);
- OUT_RING(chan, 0);
- }
- nvfx->relocs_needed &=~ NVFX_RELOCATE_FRAMEBUFFER;
-}
-
-void
-nvfx_framebuffer_relocate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel *chan = nvfx->screen->base.channel;
- unsigned rt_flags = NOUVEAU_BO_RDWR | NOUVEAU_BO_VRAM;
- rt_flags |= NOUVEAU_BO_DUMMY;
- MARK_RING(chan, 20, 20);
-
-#define DO_(var, pfx, name) \
- if(var.bo) { \
- OUT_RELOC(chan, var.bo, RING_3D(pfx##_3D_DMA_##name, 1), rt_flags, 0, 0); \
- OUT_RELOC(chan, var.bo, 0, \
- rt_flags | NOUVEAU_BO_OR, \
- chan->vram->handle, chan->gart->handle); \
- OUT_RELOC(chan, var.bo, RING_3D(pfx##_3D_##name##_OFFSET, 1), rt_flags, 0, 0); \
- OUT_RELOC(chan, var.bo, \
- var.offset, rt_flags | NOUVEAU_BO_LOW, \
- 0, 0); \
- }
-
-#define DO(pfx, num) DO_(nvfx->hw_rt[num], pfx, COLOR##num)
- DO(NV30, 0);
- DO(NV30, 1);
- DO(NV40, 2);
- DO(NV40, 3);
-
- DO_(nvfx->hw_zeta, NV30, ZETA);
- nvfx->relocs_needed &=~ NVFX_RELOCATE_FRAMEBUFFER;
-}
+++ /dev/null
-
-/**************************************************************************
- *
- * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
- * All Rights Reserved.
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the
- * "Software"), to deal in the Software without restriction, including
- * without limitation the rights to use, copy, modify, merge, publish,
- * distribute, sub license, and/or sell copies of the Software, and to
- * permit persons to whom the Software is furnished to do so, subject to
- * the following conditions:
- *
- * The above copyright notice and this permission notice (including the
- * next paragraph) shall be included in all copies or substantial portions
- * of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
- * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
- * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
- * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
- * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
- * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
- *
- **************************************************************************/
-
-#include "pipe/p_context.h"
-#include "pipe/p_format.h"
-#include "util/u_format.h"
-#include "util/u_math.h"
-#include "util/u_memory.h"
-#include "util/u_pack_color.h"
-#include "util/u_blitter.h"
-#include "util/u_surface.h"
-
-#include "nouveau/nouveau_winsys.h"
-#include "nouveau/nouveau_screen.h"
-#include "nvfx_context.h"
-#include "nvfx_screen.h"
-#include "nvfx_resource.h"
-#include "nv04_2d.h"
-
-#include <nouveau/nouveau_bo.h>
-
-static INLINE void
-nvfx_region_set_format(struct nv04_region* rgn, enum pipe_format format)
-{
- unsigned bits = util_format_get_blocksizebits(format);
- unsigned shift = 0;
- rgn->one_bits = 0;
-
- switch(bits)
- {
- case 8:
- rgn->bpps = 0;
- break;
- case 16:
- rgn->bpps = 1;
- if(format == PIPE_FORMAT_B5G5R5X1_UNORM)
- rgn->one_bits = 1;
- break;
- case 32:
- rgn->bpps = 2;
- if(format == PIPE_FORMAT_R8G8B8X8_UNORM || format == PIPE_FORMAT_B8G8R8X8_UNORM)
- rgn->one_bits = 8;
- break;
- case 64:
- rgn->bpps = 2;
- shift = 1;
- break;
- case 128:
- rgn->bpps = 2;
- shift = 2;
- break;
- }
-
- if(shift) {
- rgn->x = util_format_get_nblocksx(format, rgn->x) << shift;
- rgn->y = util_format_get_nblocksy(format, rgn->y);
- rgn->w <<= shift;
- }
-}
-
-static INLINE void
-nvfx_region_init_for_surface(struct nv04_region* rgn, struct nvfx_surface* surf, unsigned x, unsigned y, boolean for_write)
-{
- rgn->x = x;
- rgn->y = y;
- rgn->z = 0;
-
- rgn->bo = ((struct nvfx_resource*)surf->base.texture)->bo;
- rgn->offset = surf->offset;
-
- if(surf->base.texture->flags & NOUVEAU_RESOURCE_FLAG_LINEAR)
- rgn->pitch = surf->pitch;
- else {
- rgn->pitch = 0;
- rgn->z = surf->base.u.tex.first_layer;
- rgn->w = surf->base.width;
- rgn->h = surf->base.height;
- rgn->d = u_minify(surf->base.texture->depth0, surf->base.u.tex.level);
- }
-
- nvfx_region_set_format(rgn, surf->base.format);
- if(!rgn->pitch)
- nv04_region_try_to_linearize(rgn);
-}
-
-static INLINE void
-nvfx_region_init_for_subresource(struct nv04_region* rgn, struct pipe_resource* pt, unsigned level, unsigned x, unsigned y, unsigned z, boolean for_write)
-{
- if(pt->target != PIPE_BUFFER)
- {
- struct nvfx_surface* ns = (struct nvfx_surface*)util_surfaces_peek(&((struct nvfx_miptree*)pt)->surfaces, pt, level, z);
- if(ns)
- {
- nvfx_region_init_for_surface(rgn, ns, x, y, for_write);
- return;
- }
- }
-
- rgn->bo = ((struct nvfx_resource*)pt)->bo;
- rgn->offset = nvfx_subresource_offset(pt, z, level, z);
- rgn->x = x;
- rgn->y = y;
-
- if(pt->flags & NOUVEAU_RESOURCE_FLAG_LINEAR)
- {
- rgn->pitch = nvfx_subresource_pitch(pt, level);
- rgn->z = 0;
- }
- else
- {
- rgn->pitch = 0;
- rgn->z = z;
- rgn->w = u_minify(pt->width0, level);
- rgn->h = u_minify(pt->height0, level);
- rgn->d = u_minify(pt->depth0, level);
- }
-
- nvfx_region_set_format(rgn, pt->format);
- if(!rgn->pitch)
- nv04_region_try_to_linearize(rgn);
-}
-
-// don't save index buffer because blitter doesn't setit
-static struct blitter_context*
-nvfx_get_blitter(struct pipe_context* pipe, int copy)
-{
- struct nvfx_context* nvfx = nvfx_context(pipe);
- struct blitter_context** pblitter;
- struct blitter_context* blitter;
-
- assert(nvfx->blitters_in_use < Elements(nvfx->blitter));
-
- if(nvfx->query && !nvfx->blitters_in_use)
- {
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- BEGIN_RING(chan, eng3d, NV30_3D_QUERY_ENABLE, 1);
- OUT_RING(chan, 0);
- }
-
- pblitter = &nvfx->blitter[nvfx->blitters_in_use++];
- if(!*pblitter)
- *pblitter = util_blitter_create(pipe);
- blitter = *pblitter;
-
- util_blitter_save_blend(blitter, nvfx->blend);
- util_blitter_save_depth_stencil_alpha(blitter, nvfx->zsa);
- util_blitter_save_stencil_ref(blitter, &nvfx->stencil_ref);
- util_blitter_save_rasterizer(blitter, nvfx->rasterizer);
- util_blitter_save_fragment_shader(blitter, nvfx->fragprog);
- util_blitter_save_vertex_shader(blitter, nvfx->vertprog);
- util_blitter_save_viewport(blitter, &nvfx->viewport);
- util_blitter_save_framebuffer(blitter, &nvfx->framebuffer);
- util_blitter_save_vertex_elements(blitter, nvfx->vtxelt);
- util_blitter_save_vertex_buffers(blitter, nvfx->vtxbuf_nr, nvfx->vtxbuf);
-
- if(copy)
- {
- util_blitter_save_fragment_sampler_states(blitter, nvfx->nr_samplers, (void**)nvfx->tex_sampler);
- util_blitter_save_fragment_sampler_views(blitter, nvfx->nr_textures, nvfx->fragment_sampler_views);
- }
-
- return blitter;
-}
-
-static inline void
-nvfx_put_blitter(struct pipe_context* pipe, struct blitter_context* blitter)
-{
- struct nvfx_context* nvfx = nvfx_context(pipe);
- --nvfx->blitters_in_use;
- assert(nvfx->blitters_in_use >= 0);
-
- if(nvfx->query && !nvfx->blitters_in_use)
- {
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- BEGIN_RING(chan, eng3d, NV30_3D_QUERY_ENABLE, 1);
- OUT_RING(chan, 1);
- }
-}
-
-static unsigned
-nvfx_region_clone(struct nv04_2d_context* ctx, struct nv04_region* rgn, unsigned w, unsigned h, boolean for_read)
-{
- unsigned begin = nv04_region_begin(rgn, w, h);
- unsigned end = nv04_region_end(rgn, w, h);
- unsigned size = end - begin;
- struct nouveau_bo* bo = 0;
- nouveau_bo_new(rgn->bo->device, NOUVEAU_BO_MAP | NOUVEAU_BO_GART, 256, size, &bo);
-
- if(for_read || (size > ((w * h) << rgn->bpps)))
- nv04_memcpy(ctx, bo, 0, rgn->bo, rgn->offset + begin, size);
-
- rgn->bo = bo;
- rgn->offset = -begin;
- return begin;
-}
-
-static void
-nvfx_resource_copy_region(struct pipe_context *pipe,
- struct pipe_resource *dstr, unsigned dst_level,
- unsigned dstx, unsigned dsty, unsigned dstz,
- struct pipe_resource *srcr, unsigned src_level,
- const struct pipe_box *src_box)
-{
- static int copy_threshold = -1;
- struct nv04_2d_context *ctx = nvfx_screen(pipe->screen)->eng2d;
- struct nv04_region dst, src;
- int dst_to_gpu;
- int src_on_gpu;
- boolean small;
- int ret;
- unsigned w = src_box->width;
- unsigned h = src_box->height;
-
- if(!w || !h)
- return;
-
- /* Fallback for buffers. */
- if (dstr->target == PIPE_BUFFER && srcr->target == PIPE_BUFFER) {
- util_resource_copy_region(pipe, dstr, dst_level, dstx, dsty, dstz,
- srcr, src_level, src_box);
- return;
- }
-
- if(copy_threshold < 0)
- copy_threshold = debug_get_num_option("NOUVEAU_COPY_THRESHOLD", 4);
-
- dst_to_gpu = dstr->usage != PIPE_USAGE_DYNAMIC && dstr->usage != PIPE_USAGE_STAGING;
- src_on_gpu = nvfx_resource_on_gpu(srcr);
-
- nvfx_region_init_for_subresource(&dst, dstr, dst_level, dstx, dsty, dstz, TRUE);
- nvfx_region_init_for_subresource(&src, srcr, src_level, src_box->x, src_box->y, src_box->z, FALSE);
- w = util_format_get_stride(dstr->format, w) >> dst.bpps;
- h = util_format_get_nblocksy(dstr->format, h);
-
- small = (w * h <= copy_threshold);
- if((!dst_to_gpu || !src_on_gpu) && small)
- ret = -1; /* use the CPU */
- else
- ret = nv04_region_copy_2d(ctx, &dst, &src, w, h, dst_to_gpu, src_on_gpu);
- if(!ret)
- {}
- else if(ret > 0
- && dstr->bind & (PIPE_BIND_RENDER_TARGET | PIPE_BIND_DEPTH_STENCIL)
- && srcr->bind & PIPE_BIND_SAMPLER_VIEW)
- {
- /* this currently works because we hack the bind flags on resource creation to be
- * the maximum set that the resource type actually supports
- *
- * TODO: perhaps support reinterpreting the formats
- */
- struct blitter_context* blitter = nvfx_get_blitter(pipe, 1);
- util_blitter_copy_texture(blitter, dstr, dst_level, dstx, dsty, dstz, srcr, src_level, src_box, TRUE);
- nvfx_put_blitter(pipe, blitter);
- }
- else
- {
- struct nv04_region dstt = dst;
- struct nv04_region srct = src;
- unsigned dstbegin = 0;
-
- if(!small)
- {
- if(src_on_gpu)
- nvfx_region_clone(ctx, &srct, w, h, TRUE);
-
- if(dst_to_gpu)
- dstbegin = nvfx_region_clone(ctx, &dstt, w, h, FALSE);
- }
-
- nv04_region_copy_cpu(&dstt, &srct, w, h);
-
- if(srct.bo != src.bo)
- nouveau_screen_bo_release(pipe->screen, srct.bo);
-
- if(dstt.bo != dst.bo)
- {
- nv04_memcpy(ctx, dst.bo, dst.offset + dstbegin, dstt.bo, 0, dstt.bo->size);
- nouveau_screen_bo_release(pipe->screen, dstt.bo);
- }
- }
-}
-
-static int
-nvfx_surface_fill(struct pipe_context* pipe, struct pipe_surface *dsts,
- unsigned dx, unsigned dy, unsigned w, unsigned h, unsigned value)
-{
- struct nv04_2d_context *ctx = nvfx_screen(pipe->screen)->eng2d;
- struct nv04_region dst;
- int ret;
- /* Always try to use the GPU right now, if possible
- * If the user wanted the surface data on the CPU, he would have cleared with memset (hopefully) */
-
- // we don't care about interior pixel order since we set all them to the same value
- nvfx_region_init_for_surface(&dst, (struct nvfx_surface*)dsts, dx, dy, TRUE);
-
- w = util_format_get_stride(dsts->format, w) >> dst.bpps;
- h = util_format_get_nblocksy(dsts->format, h);
-
- ret = nv04_region_fill_2d(ctx, &dst, w, h, value);
- if(ret > 0 && dsts->texture->bind & PIPE_BIND_RENDER_TARGET)
- return 1;
- else if(ret)
- {
- struct nv04_region dstt = dst;
- unsigned dstbegin = 0;
-
- if(nvfx_resource_on_gpu(dsts->texture))
- dstbegin = nvfx_region_clone(ctx, &dstt, w, h, FALSE);
-
- nv04_region_fill_cpu(&dstt, w, h, value);
-
- if(dstt.bo != dst.bo)
- {
- nv04_memcpy(ctx, dst.bo, dst.offset + dstbegin, dstt.bo, 0, dstt.bo->size);
- nouveau_screen_bo_release(pipe->screen, dstt.bo);
- }
- }
-
- return 0;
-}
-
-
-void
-nvfx_screen_surface_takedown(struct pipe_screen *pscreen)
-{
- nv04_2d_context_takedown(nvfx_screen(pscreen)->eng2d);
- nvfx_screen(pscreen)->eng2d = 0;
-}
-
-int
-nvfx_screen_surface_init(struct pipe_screen *pscreen)
-{
- struct nv04_2d_context* ctx = nv04_2d_context_init(nouveau_screen(pscreen)->channel);
- if(!ctx)
- return -1;
- nvfx_screen(pscreen)->eng2d = ctx;
- return 0;
-}
-
-static void
-nvfx_clear_render_target(struct pipe_context *pipe,
- struct pipe_surface *dst,
- const union pipe_color_union *color,
- unsigned dstx, unsigned dsty,
- unsigned width, unsigned height)
-{
- union util_color uc;
- util_pack_color(color->f, dst->format, &uc);
-
- if(util_format_get_blocksizebits(dst->format) > 32
- || nvfx_surface_fill(pipe, dst, dstx, dsty, width, height, uc.ui))
- {
- // TODO: probably should use hardware clear here instead if possible
- struct blitter_context* blitter = nvfx_get_blitter(pipe, 0);
- util_blitter_clear_render_target(blitter, dst, color, dstx, dsty, width, height);
- nvfx_put_blitter(pipe, blitter);
- }
-}
-
-static void
-nvfx_clear_depth_stencil(struct pipe_context *pipe,
- struct pipe_surface *dst,
- unsigned clear_flags,
- double depth,
- unsigned stencil,
- unsigned dstx, unsigned dsty,
- unsigned width, unsigned height)
-{
- if(util_format_get_blocksizebits(dst->format) > 32
- || nvfx_surface_fill(pipe, dst, dstx, dsty, width, height, util_pack_z_stencil(dst->format, depth, stencil)))
- {
- // TODO: probably should use hardware clear here instead if possible
- struct blitter_context* blitter = nvfx_get_blitter(pipe, 0);
- util_blitter_clear_depth_stencil(blitter, dst, clear_flags, depth, stencil, dstx, dsty, width, height);
- nvfx_put_blitter(pipe, blitter);
- }
-}
-
-
-void
-nvfx_init_surface_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.resource_copy_region = nvfx_resource_copy_region;
- nvfx->pipe.clear_render_target = nvfx_clear_render_target;
- nvfx->pipe.clear_depth_stencil = nvfx_clear_depth_stencil;
-}
+++ /dev/null
-#ifndef NVFX_TEX_H_
-#define NVFX_TEX_H_
-
-#include "util/u_math.h"
-#include "pipe/p_defines.h"
-#include "pipe/p_state.h"
-
-
-static inline unsigned
-nvfx_tex_wrap_mode(unsigned wrap) {
- unsigned ret;
-
- switch (wrap) {
- case PIPE_TEX_WRAP_REPEAT:
- ret = NV30_3D_TEX_WRAP_S_REPEAT;
- break;
- case PIPE_TEX_WRAP_MIRROR_REPEAT:
- ret = NV30_3D_TEX_WRAP_S_MIRRORED_REPEAT;
- break;
- case PIPE_TEX_WRAP_CLAMP_TO_EDGE:
- ret = NV30_3D_TEX_WRAP_S_CLAMP_TO_EDGE;
- break;
- case PIPE_TEX_WRAP_CLAMP_TO_BORDER:
- ret = NV30_3D_TEX_WRAP_S_CLAMP_TO_BORDER;
- break;
- case PIPE_TEX_WRAP_CLAMP:
- ret = NV30_3D_TEX_WRAP_S_CLAMP;
- break;
- case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_EDGE:
- ret = NV40_3D_TEX_WRAP_S_MIRROR_CLAMP_TO_EDGE;
- break;
- case PIPE_TEX_WRAP_MIRROR_CLAMP_TO_BORDER:
- ret = NV40_3D_TEX_WRAP_S_MIRROR_CLAMP_TO_BORDER;
- break;
- case PIPE_TEX_WRAP_MIRROR_CLAMP:
- ret = NV40_3D_TEX_WRAP_S_MIRROR_CLAMP;
- break;
- default:
- assert(0);
- ret = NV30_3D_TEX_WRAP_S_REPEAT;
- break;
- }
-
- return ret >> NV30_3D_TEX_WRAP_S__SHIFT;
-}
-
-static inline unsigned
-nvfx_tex_wrap_compare_mode(unsigned func)
-{
- switch (func) {
- case PIPE_FUNC_NEVER:
- return NV30_3D_TEX_WRAP_RCOMP_NEVER;
- case PIPE_FUNC_GREATER:
- return NV30_3D_TEX_WRAP_RCOMP_GREATER;
- case PIPE_FUNC_EQUAL:
- return NV30_3D_TEX_WRAP_RCOMP_EQUAL;
- case PIPE_FUNC_GEQUAL:
- return NV30_3D_TEX_WRAP_RCOMP_GEQUAL;
- case PIPE_FUNC_LESS:
- return NV30_3D_TEX_WRAP_RCOMP_LESS;
- case PIPE_FUNC_NOTEQUAL:
- return NV30_3D_TEX_WRAP_RCOMP_NOTEQUAL;
- case PIPE_FUNC_LEQUAL:
- return NV30_3D_TEX_WRAP_RCOMP_LEQUAL;
- case PIPE_FUNC_ALWAYS:
- return NV30_3D_TEX_WRAP_RCOMP_ALWAYS;
- default:
- assert(0);
- return 0;
- }
-}
-
-static inline unsigned nvfx_tex_filter(const struct pipe_sampler_state* cso)
-{
- unsigned filter = 0;
- switch (cso->mag_img_filter) {
- case PIPE_TEX_FILTER_LINEAR:
- filter |= NV30_3D_TEX_FILTER_MAG_LINEAR;
- break;
- case PIPE_TEX_FILTER_NEAREST:
- default:
- filter |= NV30_3D_TEX_FILTER_MAG_NEAREST;
- break;
- }
-
- switch (cso->min_img_filter) {
- case PIPE_TEX_FILTER_LINEAR:
- switch (cso->min_mip_filter) {
- case PIPE_TEX_MIPFILTER_NEAREST:
- filter |= NV30_3D_TEX_FILTER_MIN_LINEAR_MIPMAP_NEAREST;
- break;
- case PIPE_TEX_MIPFILTER_LINEAR:
- filter |= NV30_3D_TEX_FILTER_MIN_LINEAR_MIPMAP_LINEAR;
- break;
- case PIPE_TEX_MIPFILTER_NONE:
- default:
- filter |= NV30_3D_TEX_FILTER_MIN_LINEAR;
- break;
- }
- break;
- case PIPE_TEX_FILTER_NEAREST:
- default:
- switch (cso->min_mip_filter) {
- case PIPE_TEX_MIPFILTER_NEAREST:
- filter |= NV30_3D_TEX_FILTER_MIN_NEAREST_MIPMAP_NEAREST;
- break;
- case PIPE_TEX_MIPFILTER_LINEAR:
- filter |= NV30_3D_TEX_FILTER_MIN_NEAREST_MIPMAP_LINEAR;
- break;
- case PIPE_TEX_MIPFILTER_NONE:
- default:
- filter |= NV30_3D_TEX_FILTER_MIN_NEAREST;
- break;
- }
- break;
- }
- return filter;
-}
-
-static inline unsigned nvfx_tex_border_color(const float* border_color)
-{
- return ((float_to_ubyte(border_color[3]) << 24) |
- (float_to_ubyte(border_color[0]) << 16) |
- (float_to_ubyte(border_color[1]) << 8) |
- (float_to_ubyte(border_color[2]) << 0));
-}
-
-struct nvfx_sampler_state {
- uint32_t fmt;
- uint32_t wrap;
- uint32_t en;
- uint32_t filt;
- uint32_t bcol;
- uint32_t min_lod;
- uint32_t max_lod;
- boolean compare;
-};
-
-struct nvfx_sampler_view {
- struct pipe_sampler_view base;
- int offset;
- uint32_t swizzle;
- uint32_t npot_size;
- uint32_t filt;
- uint32_t wrap_mask;
- uint32_t wrap;
- uint32_t lod_offset;
- uint32_t max_lod_limit;
- union
- {
- struct
- {
- uint32_t fmt[4]; /* nv30 has 4 entries, nv40 one */
- int rect;
- } nv30;
- struct
- {
- uint32_t fmt[2]; /* nv30 has 4 entries, nv40 one */
- uint32_t npot_size2; /* nv40 only */
- } nv40;
- uint32_t init_fmt;
- } u;
-};
-
-struct nvfx_texture_format {
- int fmt[6];
- unsigned sign;
- unsigned wrap;
- unsigned char src[6];
- unsigned char comp[6];
-};
-
-extern struct nvfx_texture_format nvfx_texture_formats[PIPE_FORMAT_COUNT];
-
-#endif /* NVFX_TEX_H_ */
+++ /dev/null
-#include "pipe/p_state.h"
-#include "pipe/p_defines.h"
-#include "util/u_inlines.h"
-#include "util/u_format.h"
-#include "util/u_memory.h"
-#include "util/u_math.h"
-#include "util/u_staging.h"
-#include "nvfx_context.h"
-#include "nvfx_screen.h"
-#include "nvfx_state.h"
-#include "nvfx_resource.h"
-#include "nvfx_transfer.h"
-
-struct nvfx_staging_transfer
-{
- struct util_staging_transfer base;
-
- unsigned offset;
- unsigned map_count;
-};
-
-struct pipe_transfer *
-nvfx_transfer_new(struct pipe_context *pipe,
- struct pipe_resource *pt,
- unsigned level,
- unsigned usage,
- const struct pipe_box *box)
-{
- if((usage & (PIPE_TRANSFER_UNSYNCHRONIZED | PIPE_TRANSFER_DONTBLOCK)) == PIPE_TRANSFER_DONTBLOCK)
- {
- struct nouveau_bo* bo = ((struct nvfx_resource*)pt)->bo;
- if(bo && nouveau_bo_busy(bo, NOUVEAU_BO_WR))
- return NULL;
- }
-
- if(pt->target == PIPE_BUFFER)
- {
- // it would be nice if we could avoid all this ridiculous overhead...
- struct pipe_transfer* tx;
- struct nvfx_buffer* buffer = nvfx_buffer(pt);
-
- tx = CALLOC_STRUCT(pipe_transfer);
- if (!tx)
- return NULL;
-
- pipe_resource_reference(&tx->resource, pt);
- tx->level = level;
- tx->usage = usage;
- tx->box = *box;
-
- tx->layer_stride = tx->stride = util_format_get_stride(pt->format, box->width);
- tx->data = buffer->data + util_format_get_stride(pt->format, box->x);
-
- return tx;
- }
- else
- {
- struct nvfx_staging_transfer* tx;
- boolean direct = !nvfx_resource_on_gpu(pt) && pt->flags & NOUVEAU_RESOURCE_FLAG_LINEAR;
-
- tx = CALLOC_STRUCT(nvfx_staging_transfer);
- if(!tx)
- return NULL;
-
- util_staging_transfer_init(pipe, pt, level, usage, box, direct, &tx->base);
-
- if(direct)
- {
- tx->base.base.stride = nvfx_subresource_pitch(pt, level);
- tx->base.base.layer_stride = tx->base.base.stride * u_minify(pt->height0, level);
- tx->offset = nvfx_subresource_offset(pt, box->z, level, box->z)
- + util_format_get_2d_size(pt->format, tx->base.base.stride, box->y)
- + util_format_get_stride(pt->format, box->x);
- }
- else
- {
- tx->base.base.stride = nvfx_subresource_pitch(tx->base.staging_resource, 0);
- tx->base.base.layer_stride = tx->base.base.stride * tx->base.staging_resource->height0;
- tx->offset = 0;
- }
-
- assert(tx->base.base.stride);
-
- return &tx->base.base;
- }
-}
-
-static void nvfx_buffer_dirty_interval(struct nvfx_buffer* buffer, unsigned begin, unsigned size, boolean unsynchronized)
-{
- struct nvfx_screen* screen = nvfx_screen(buffer->base.base.screen);
- buffer->last_update_static = buffer->bytes_to_draw_until_static < 0;
- if(buffer->dirty_begin == buffer->dirty_end)
- {
- buffer->dirty_begin = begin;
- buffer->dirty_end = begin + size;
- buffer->dirty_unsynchronized = unsynchronized;
- }
- else
- {
- buffer->dirty_begin = MIN2(buffer->dirty_begin, begin);
- buffer->dirty_end = MAX2(buffer->dirty_end, begin + size);
- buffer->dirty_unsynchronized &= unsynchronized;
- }
-
- if(unsynchronized)
- {
- // TODO: revisit this, it doesn't seem quite right
- //printf("UNSYNC UPDATE %p %u %u\n", buffer, begin, size);
- buffer->bytes_to_draw_until_static += size * screen->static_reuse_threshold;
- }
- else
- buffer->bytes_to_draw_until_static = buffer->size * screen->static_reuse_threshold;
-}
-
-static void nvfx_transfer_flush_region( struct pipe_context *pipe,
- struct pipe_transfer *ptx,
- const struct pipe_box *box)
-{
- if(ptx->resource->target == PIPE_BUFFER && (ptx->usage & PIPE_TRANSFER_FLUSH_EXPLICIT))
- {
- struct nvfx_buffer* buffer = nvfx_buffer(ptx->resource);
- nvfx_buffer_dirty_interval(buffer,
- (uint8_t*)ptx->data - buffer->data + util_format_get_stride(buffer->base.base.format, box->x),
- util_format_get_stride(buffer->base.base.format, box->width),
- !!(ptx->usage & PIPE_TRANSFER_UNSYNCHRONIZED));
- }
-}
-
-static void
-nvfx_transfer_destroy(struct pipe_context *pipe, struct pipe_transfer *ptx)
-{
- if(ptx->resource->target == PIPE_BUFFER)
- {
- struct nvfx_buffer* buffer = nvfx_buffer(ptx->resource);
- if((ptx->usage & (PIPE_TRANSFER_WRITE | PIPE_TRANSFER_FLUSH_EXPLICIT)) == PIPE_TRANSFER_WRITE)
- nvfx_buffer_dirty_interval(buffer,
- (uint8_t*)ptx->data - buffer->data,
- ptx->stride,
- !!(ptx->usage & PIPE_TRANSFER_UNSYNCHRONIZED));
- pipe_resource_reference(&ptx->resource, 0);
- FREE(ptx);
- }
- else
- {
- struct nouveau_channel* chan = nvfx_context(pipe)->screen->base.channel;
- util_staging_transfer_destroy(pipe, ptx);
-
- FIRE_RING(chan);
- }
-}
-
-void *
-nvfx_transfer_map(struct pipe_context *pipe, struct pipe_transfer *ptx)
-{
- if(ptx->resource->target == PIPE_BUFFER)
- return ptx->data;
- else
- {
- struct nvfx_staging_transfer *tx = (struct nvfx_staging_transfer *)ptx;
- if(!ptx->data)
- {
- struct nvfx_miptree *mt = (struct nvfx_miptree *)tx->base.staging_resource;
- uint8_t *map = nouveau_screen_bo_map(pipe->screen, mt->base.bo, nouveau_screen_transfer_flags(ptx->usage));
- ptx->data = map + tx->offset;
- }
-
- ++tx->map_count;
- return ptx->data;
- }
-}
-
-void
-nvfx_transfer_unmap(struct pipe_context *pipe, struct pipe_transfer *ptx)
-{
- if(ptx->resource->target != PIPE_BUFFER)
- {
- struct nvfx_staging_transfer *tx = (struct nvfx_staging_transfer *)ptx;
- struct nvfx_miptree *mt = (struct nvfx_miptree *)tx->base.staging_resource;
-
- if(!--tx->map_count)
- {
- nouveau_screen_bo_unmap(pipe->screen, mt->base.bo);
- ptx->data = 0;
- }
- }
-}
-
-static void nvfx_transfer_inline_write( struct pipe_context *pipe,
- struct pipe_resource *pr,
- unsigned level,
- unsigned usage,
- const struct pipe_box *box,
- const void *data,
- unsigned stride,
- unsigned slice_stride)
-{
- if(pr->target != PIPE_BUFFER)
- {
- u_default_transfer_inline_write(pipe, pr, level, usage, box, data, stride, slice_stride);
- }
- else
- {
- struct nvfx_buffer* buffer = nvfx_buffer(pr);
- unsigned begin = util_format_get_stride(pr->format, box->x);
- unsigned size = util_format_get_stride(pr->format, box->width);
- memcpy(buffer->data + begin, data, size);
- nvfx_buffer_dirty_interval(buffer, begin, size,
- !!(pr->flags & PIPE_TRANSFER_UNSYNCHRONIZED));
- }
-}
-
-void
-nvfx_init_transfer_functions(struct pipe_context *pipe)
-{
- pipe->get_transfer = nvfx_transfer_new;
- pipe->transfer_map = nvfx_transfer_map;
- pipe->transfer_flush_region = nvfx_transfer_flush_region;
- pipe->transfer_unmap = nvfx_transfer_unmap;
- pipe->transfer_destroy = nvfx_transfer_destroy;
- pipe->transfer_inline_write = nvfx_transfer_inline_write;
-}
+++ /dev/null
-
-#ifndef NVFX_TRANSFER_H
-#define NVFX_TRANSFER_H
-
-#include "util/u_transfer.h"
-#include "pipe/p_state.h"
-
-
-struct pipe_transfer *
-nvfx_transfer_new(struct pipe_context *pcontext,
- struct pipe_resource *pt,
- unsigned level,
- unsigned usage,
- const struct pipe_box *box);
-
-void *
-nvfx_transfer_map(struct pipe_context *pcontext,
- struct pipe_transfer *ptx);
-void
-nvfx_transfer_unmap(struct pipe_context *pcontext,
- struct pipe_transfer *ptx);
-
-
-#endif
+++ /dev/null
-#include "pipe/p_context.h"
-#include "pipe/p_state.h"
-#include "util/u_inlines.h"
-#include "util/u_format.h"
-#include "util/u_transfer.h"
-#include "translate/translate.h"
-
-#include "nvfx_context.h"
-#include "nvfx_state.h"
-#include "nvfx_resource.h"
-
-#include "nouveau/nouveau_channel.h"
-#include "nouveau/nv04_pushbuf.h"
-
-static inline unsigned
-util_guess_unique_indices_count(unsigned mode, unsigned indices)
-{
- /* Euler's formula gives V =
- * = E - F + 2 =
- * = F * (polygon_edges / 2 - 1) + 2 =
- * = F * (polygon_edges - 2) / 2 + 2 =
- * = indices * (polygon_edges - 2) / (2 * indices_per_face) + 2
- * = indices * (1 / 2 - 1 / polygon_edges) + 2
- */
- switch(mode)
- {
- case PIPE_PRIM_LINES:
- return indices >> 1;
- case PIPE_PRIM_TRIANGLES:
- {
- // avoid an expensive division by 3 using the multiplicative inverse mod 2^32
- unsigned q;
- unsigned inv3 = 2863311531;
- indices >>= 1;
- q = indices * inv3;
- if(unlikely(q >= indices))
- {
- q += inv3;
- if(q >= indices)
- q += inv3;
- }
- return indices + 2;
- //return indices / 6 + 2;
- }
- // guess that indexed quads are created by successive connections, since a closed mesh seems unlikely
- case PIPE_PRIM_QUADS:
- return (indices >> 1) + 2;
- // return (indices >> 2) + 2; // if it is a closed mesh
- default:
- return indices;
- }
-}
-
-static unsigned nvfx_decide_upload_mode(struct pipe_context *pipe, const struct pipe_draw_info *info)
-{
- struct nvfx_context* nvfx = nvfx_context(pipe);
- unsigned hardware_cost = 0;
- unsigned inline_cost = 0;
- unsigned unique_vertices;
- unsigned upload_mode;
- float best_index_cost_for_hardware_vertices_as_inline_cost;
- boolean prefer_hardware_indices;
- unsigned index_inline_cost;
- unsigned index_hardware_cost;
- if (info->indexed)
- unique_vertices = util_guess_unique_indices_count(info->mode, info->count);
- else
- unique_vertices = info->count;
-
- /* Here we try to figure out if we are better off writing vertex data directly on the FIFO,
- * or create hardware buffer objects and pointing the hardware to them.
- *
- * This is done by computing the total memcpy cost of each option, ignoring uploads
- * if we think that the buffer is static and thus the upload cost will be amortized over
- * future draw calls.
- *
- * For instance, if everything looks static, we will always create buffer objects, while if
- * everything is a user buffer and we are not doing indexed drawing, we never do.
- *
- * Other interesting cases are where a small user vertex buffer, but a huge user index buffer,
- * where we will upload the vertex buffer, so that we can use hardware index lookup, and
- * the opposite case, where we instead do index lookup in software to avoid uploading
- * a huge amount of vertex data that is not going to be used.
- *
- * Otherwise, we generally move to the GPU the after it has been pushed
- * NVFX_STATIC_BUFFER_MIN_REUSE_TIMES times to the GPU without having
- * been updated with a transfer (or just the buffer having been destroyed).
- *
- * There is no special handling for user buffers, since applications can use
- * OpenGL VBOs in a one-shot fashion. OpenGL 3/4 core profile forces this
- * by the way.
- *
- * Note that currently we don't support only putting some data on the FIFO, and
- * some on vertex buffers (constant and instanced data is independent from this).
- *
- * nVidia doesn't seem to do this either, even though it should be at least
- * doable with VTX_ATTR and possibly with VERTEX_DATA too if not indexed.
- */
-
- for (unsigned i = 0; i < nvfx->vtxelt->num_per_vertex_buffer_infos; i++)
- {
- struct nvfx_per_vertex_buffer_info* vbi = &nvfx->vtxelt->per_vertex_buffer_info[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[vbi->vertex_buffer_index];
- struct nvfx_buffer* buffer = nvfx_buffer(vb->buffer);
- buffer->bytes_to_draw_until_static -= vbi->per_vertex_size * unique_vertices;
- if (!nvfx_buffer_seems_static(buffer))
- {
- hardware_cost += buffer->dirty_end - buffer->dirty_begin;
- if (!buffer->base.bo)
- hardware_cost += nvfx->screen->buffer_allocation_cost;
- }
- inline_cost += vbi->per_vertex_size * info->count;
- }
-
- best_index_cost_for_hardware_vertices_as_inline_cost = 0.0f;
- prefer_hardware_indices = FALSE;
- index_inline_cost = 0;
- index_hardware_cost = 0;
-
- if (info->indexed)
- {
- index_inline_cost = nvfx->idxbuf.index_size * info->count;
- if (nvfx->screen->index_buffer_reloc_flags
- && (nvfx->idxbuf.index_size == 2 || nvfx->idxbuf.index_size == 4)
- && !(nvfx->idxbuf.offset & (nvfx->idxbuf.index_size - 1)))
- {
- struct nvfx_buffer* buffer = nvfx_buffer(nvfx->idxbuf.buffer);
- buffer->bytes_to_draw_until_static -= index_inline_cost;
-
- prefer_hardware_indices = TRUE;
-
- if (!nvfx_buffer_seems_static(buffer))
- {
- index_hardware_cost = buffer->dirty_end - buffer->dirty_begin;
- if (!buffer->base.bo)
- index_hardware_cost += nvfx->screen->buffer_allocation_cost;
- }
-
- if ((float) index_inline_cost < (float) index_hardware_cost * nvfx->screen->inline_cost_per_hardware_cost)
- {
- best_index_cost_for_hardware_vertices_as_inline_cost = (float) index_inline_cost;
- }
- else
- {
- best_index_cost_for_hardware_vertices_as_inline_cost = (float) index_hardware_cost * nvfx->screen->inline_cost_per_hardware_cost;
- prefer_hardware_indices = TRUE;
- }
- }
- }
-
- /* let's finally figure out which of the 3 paths we want to take */
- if ((float) (inline_cost + index_inline_cost) > ((float) hardware_cost * nvfx->screen->inline_cost_per_hardware_cost + best_index_cost_for_hardware_vertices_as_inline_cost))
- upload_mode = 1 + prefer_hardware_indices;
- else
- upload_mode = 0;
-
-#ifdef DEBUG
- if (unlikely(nvfx->screen->trace_draw))
- {
- fprintf(stderr, "DRAW");
- if (info->indexed)
- {
- fprintf(stderr, "_IDX%u", nvfx->idxbuf.index_size);
- if (info->index_bias)
- fprintf(stderr, " biased %u", info->index_bias);
- fprintf(stderr, " idxrange %u -> %u", info->min_index, info->max_index);
- }
- if (info->instance_count > 1)
- fprintf(stderr, " %u instances from %u", info->instance_count, info->indexed);
- fprintf(stderr, " start %u count %u prim %u", info->start, info->count, info->mode);
- if (!upload_mode)
- fprintf(stderr, " -> inline vertex data");
- else if (upload_mode == 2 || !info->indexed)
- fprintf(stderr, " -> buffer range");
- else
- fprintf(stderr, " -> inline indices");
- fprintf(stderr, " [ivtx %u hvtx %u iidx %u hidx %u bidx %f] <", inline_cost, hardware_cost, index_inline_cost, index_hardware_cost, best_index_cost_for_hardware_vertices_as_inline_cost);
- for (unsigned i = 0; i < nvfx->vtxelt->num_per_vertex_buffer_infos; ++i)
- {
- struct nvfx_per_vertex_buffer_info* vbi = &nvfx->vtxelt->per_vertex_buffer_info[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[vbi->vertex_buffer_index];
- struct nvfx_buffer* buffer = nvfx_buffer(vb->buffer);
- if (i)
- fprintf(stderr, ", ");
- fprintf(stderr, "%p%s left %Li", buffer, buffer->last_update_static ? " static" : "", buffer->bytes_to_draw_until_static);
- }
- fprintf(stderr, ">\n");
- }
-#endif
-
- return upload_mode;
-}
-
-void nvfx_draw_vbo(struct pipe_context *pipe, const struct pipe_draw_info *info)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- unsigned upload_mode = 0;
-
- if (!nvfx->vtxelt->needs_translate)
- upload_mode = nvfx_decide_upload_mode(pipe, info);
-
- nvfx->use_index_buffer = upload_mode > 1;
-
- if ((upload_mode > 0) != nvfx->use_vertex_buffers)
- {
- nvfx->use_vertex_buffers = (upload_mode > 0);
- nvfx->dirty |= NVFX_NEW_ARRAYS;
- nvfx->draw_dirty |= NVFX_NEW_ARRAYS;
- }
-
- if (upload_mode > 0)
- {
- for (unsigned i = 0; i < nvfx->vtxelt->num_per_vertex_buffer_infos; i++)
- {
- struct nvfx_per_vertex_buffer_info* vbi = &nvfx->vtxelt->per_vertex_buffer_info[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[vbi->vertex_buffer_index];
- nvfx_buffer_upload(nvfx_buffer(vb->buffer));
- }
-
- if (upload_mode > 1)
- {
- nvfx_buffer_upload(nvfx_buffer(nvfx->idxbuf.buffer));
-
- if (unlikely(info->index_bias != nvfx->base_vertex))
- {
- nvfx->base_vertex = info->index_bias;
- nvfx->dirty |= NVFX_NEW_ARRAYS;
- }
- }
- else
- {
- if (unlikely(info->start < nvfx->base_vertex && nvfx->base_vertex))
- {
- nvfx->base_vertex = 0;
- nvfx->dirty |= NVFX_NEW_ARRAYS;
- }
- }
- }
-
- if (nvfx->screen->force_swtnl || !nvfx_state_validate(nvfx))
- nvfx_draw_vbo_swtnl(pipe, info);
- else
- nvfx_push_vbo(pipe, info);
-}
-
-boolean
-nvfx_vbo_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- int i;
- int elements = MAX2(nvfx->vtxelt->num_elements, nvfx->hw_vtxelt_nr);
- unsigned vb_flags = nvfx->screen->vertex_buffer_reloc_flags | NOUVEAU_BO_RD;
-
- if (!elements)
- return TRUE;
-
- MARK_RING(chan, (5 + 2) * 16 + 2 + 11, 16 + 2);
- for(unsigned i = 0; i < nvfx->vtxelt->num_constant; ++i)
- {
- struct nvfx_low_frequency_element *ve = &nvfx->vtxelt->constant[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[ve->vertex_buffer_index];
- struct nvfx_buffer* buffer = nvfx_buffer(vb->buffer);
- float v[4];
- ve->fetch_rgba_float(v, buffer->data + vb->buffer_offset + ve->src_offset, 0, 0);
- nvfx_emit_vtx_attr(chan, eng3d, ve->idx, v, ve->ncomp);
- }
-
-
- BEGIN_RING(chan, eng3d, NV30_3D_VTXFMT(0), elements);
- if(nvfx->use_vertex_buffers)
- {
- unsigned idx = 0;
- for (i = 0; i < nvfx->vtxelt->num_per_vertex; i++) {
- struct nvfx_per_vertex_element *ve = &nvfx->vtxelt->per_vertex[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[ve->vertex_buffer_index];
-
- if(idx != ve->idx)
- {
- assert(idx < ve->idx);
- OUT_RINGp(chan, &nvfx->vtxelt->vtxfmt[idx], ve->idx - idx);
- idx = ve->idx;
- }
-
- OUT_RING(chan, nvfx->vtxelt->vtxfmt[idx] | (vb->stride << NV30_3D_VTXFMT_STRIDE__SHIFT));
- ++idx;
- }
- if(idx != nvfx->vtxelt->num_elements)
- OUT_RINGp(chan, &nvfx->vtxelt->vtxfmt[idx], nvfx->vtxelt->num_elements - idx);
- }
- else
- OUT_RINGp(chan, nvfx->vtxelt->vtxfmt, nvfx->vtxelt->num_elements);
-
- for(i = nvfx->vtxelt->num_elements; i < elements; ++i)
- OUT_RING(chan, NV30_3D_VTXFMT_TYPE_V32_FLOAT);
-
- if(nvfx->is_nv4x) {
- unsigned i;
- /* seems to be some kind of cache flushing */
- for(i = 0; i < 3; ++i) {
- BEGIN_RING(chan, eng3d, 0x1718, 1);
- OUT_RING(chan, 0);
- }
- }
-
- BEGIN_RING(chan, eng3d, NV30_3D_VTXBUF(0), elements);
- if(nvfx->use_vertex_buffers)
- {
- unsigned idx = 0;
- for (i = 0; i < nvfx->vtxelt->num_per_vertex; i++) {
- struct nvfx_per_vertex_element *ve = &nvfx->vtxelt->per_vertex[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[ve->vertex_buffer_index];
- struct nouveau_bo* bo = nvfx_resource(vb->buffer)->bo;
-
- for(; idx < ve->idx; ++idx)
- OUT_RING(chan, 0);
-
- OUT_RELOC(chan, bo,
- vb->buffer_offset + ve->src_offset + nvfx->base_vertex * vb->stride,
- vb_flags | NOUVEAU_BO_LOW | NOUVEAU_BO_OR,
- 0, NV30_3D_VTXBUF_DMA1);
- ++idx;
- }
-
- for(; idx < elements; ++idx)
- OUT_RING(chan, 0);
- }
- else
- {
- for (i = 0; i < elements; i++)
- OUT_RING(chan, 0);
- }
-
- BEGIN_RING(chan, eng3d, 0x1710, 1);
- OUT_RING(chan, 0);
-
- nvfx->hw_vtxelt_nr = nvfx->vtxelt->num_elements;
- nvfx->relocs_needed &=~ NVFX_RELOCATE_VTXBUF;
- return TRUE;
-}
-
-void
-nvfx_vbo_swtnl_validate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- struct nouveau_grobj *eng3d = nvfx->screen->eng3d;
- unsigned num_outputs = nvfx->vertprog->draw_elements;
- int elements = MAX2(num_outputs, nvfx->hw_vtxelt_nr);
-
- if (!elements)
- return;
-
- BEGIN_RING(chan, eng3d, NV30_3D_VTXFMT(0), elements);
- for(unsigned i = 0; i < num_outputs; ++i)
- OUT_RING(chan, (4 << NV30_3D_VTXFMT_SIZE__SHIFT) | NV30_3D_VTXFMT_TYPE_V32_FLOAT);
- for(unsigned i = num_outputs; i < elements; ++i)
- OUT_RING(chan, NV30_3D_VTXFMT_TYPE_V32_FLOAT);
-
- if(nvfx->is_nv4x) {
- unsigned i;
- /* seems to be some kind of cache flushing */
- for(i = 0; i < 3; ++i) {
- BEGIN_RING(chan, eng3d, 0x1718, 1);
- OUT_RING(chan, 0);
- }
- }
-
- BEGIN_RING(chan, eng3d, NV30_3D_VTXBUF(0), elements);
- for (unsigned i = 0; i < elements; i++)
- OUT_RING(chan, 0);
-
- BEGIN_RING(chan, eng3d, 0x1710, 1);
- OUT_RING(chan, 0);
-
- nvfx->hw_vtxelt_nr = num_outputs;
- nvfx->relocs_needed &=~ NVFX_RELOCATE_VTXBUF;
-}
-
-void
-nvfx_vbo_relocate(struct nvfx_context *nvfx)
-{
- struct nouveau_channel* chan;
- unsigned vb_flags;
- int i;
-
- if(!nvfx->use_vertex_buffers)
- return;
-
- chan = nvfx->screen->base.channel;
- vb_flags = nvfx->screen->vertex_buffer_reloc_flags | NOUVEAU_BO_RD | NOUVEAU_BO_DUMMY;
-
- MARK_RING(chan, 2 * 16 + 3, 2 * 16 + 3);
- for (i = 0; i < nvfx->vtxelt->num_per_vertex; i++) {
- struct nvfx_per_vertex_element *ve = &nvfx->vtxelt->per_vertex[i];
- struct pipe_vertex_buffer *vb = &nvfx->vtxbuf[ve->vertex_buffer_index];
- struct nouveau_bo* bo = nvfx_resource(vb->buffer)->bo;
-
- OUT_RELOC(chan, bo, RING_3D(NV30_3D_VTXBUF(ve->idx), 1),
- vb_flags, 0, 0);
- OUT_RELOC(chan, bo, vb->buffer_offset + ve->src_offset + nvfx->base_vertex * vb->stride,
- vb_flags | NOUVEAU_BO_LOW | NOUVEAU_BO_OR,
- 0, NV30_3D_VTXBUF_DMA1);
- }
- nvfx->relocs_needed &=~ NVFX_RELOCATE_VTXBUF;
-}
-
-static void
-nvfx_idxbuf_emit(struct nvfx_context* nvfx, unsigned ib_flags)
-{
- struct nouveau_channel* chan = nvfx->screen->base.channel;
- unsigned ib_format = (nvfx->idxbuf.index_size == 2) ? NV30_3D_IDXBUF_FORMAT_TYPE_U16 : NV30_3D_IDXBUF_FORMAT_TYPE_U32;
- struct nouveau_bo* bo = nvfx_resource(nvfx->idxbuf.buffer)->bo;
- ib_flags |= nvfx->screen->index_buffer_reloc_flags | NOUVEAU_BO_RD;
-
- assert(nvfx->screen->index_buffer_reloc_flags);
-
- MARK_RING(chan, 3, 3);
- if(ib_flags & NOUVEAU_BO_DUMMY)
- OUT_RELOC(chan, bo, RING_3D(NV30_3D_IDXBUF_OFFSET, 2), ib_flags, 0, 0);
- else
- OUT_RING(chan, RING_3D(NV30_3D_IDXBUF_OFFSET, 2));
- OUT_RELOC(chan, bo, nvfx->idxbuf.offset + 1, ib_flags | NOUVEAU_BO_LOW, 0, 0);
- OUT_RELOC(chan, bo, ib_format, ib_flags | NOUVEAU_BO_OR,
- 0, NV30_3D_IDXBUF_FORMAT_DMA1);
- nvfx->relocs_needed &=~ NVFX_RELOCATE_IDXBUF;
-}
-
-void
-nvfx_idxbuf_validate(struct nvfx_context* nvfx)
-{
- nvfx_idxbuf_emit(nvfx, 0);
-}
-
-void
-nvfx_idxbuf_relocate(struct nvfx_context* nvfx)
-{
- nvfx_idxbuf_emit(nvfx, NOUVEAU_BO_DUMMY);
-}
-
-unsigned nvfx_vertex_formats[PIPE_FORMAT_COUNT] =
-{
- [PIPE_FORMAT_R32_FLOAT] = NV30_3D_VTXFMT_TYPE_V32_FLOAT,
- [PIPE_FORMAT_R32G32_FLOAT] = NV30_3D_VTXFMT_TYPE_V32_FLOAT,
- [PIPE_FORMAT_R32G32B32_FLOAT] = NV30_3D_VTXFMT_TYPE_V32_FLOAT,
- [PIPE_FORMAT_R32G32B32A32_FLOAT] = NV30_3D_VTXFMT_TYPE_V32_FLOAT,
- [PIPE_FORMAT_R16_FLOAT] = NV30_3D_VTXFMT_TYPE_V16_FLOAT,
- [PIPE_FORMAT_R16G16_FLOAT] = NV30_3D_VTXFMT_TYPE_V16_FLOAT,
- [PIPE_FORMAT_R16G16B16_FLOAT] = NV30_3D_VTXFMT_TYPE_V16_FLOAT,
- [PIPE_FORMAT_R16G16B16A16_FLOAT] = NV30_3D_VTXFMT_TYPE_V16_FLOAT,
- [PIPE_FORMAT_R8_UNORM] = NV30_3D_VTXFMT_TYPE_U8_UNORM,
- [PIPE_FORMAT_R8G8_UNORM] = NV30_3D_VTXFMT_TYPE_U8_UNORM,
- [PIPE_FORMAT_R8G8B8_UNORM] = NV30_3D_VTXFMT_TYPE_U8_UNORM,
- [PIPE_FORMAT_R8G8B8A8_UNORM] = NV30_3D_VTXFMT_TYPE_U8_UNORM,
- [PIPE_FORMAT_R8G8B8A8_USCALED] = NV30_3D_VTXFMT_TYPE_U8_USCALED,
- [PIPE_FORMAT_R16_SNORM] = NV30_3D_VTXFMT_TYPE_V16_SNORM,
- [PIPE_FORMAT_R16G16_SNORM] = NV30_3D_VTXFMT_TYPE_V16_SNORM,
- [PIPE_FORMAT_R16G16B16_SNORM] = NV30_3D_VTXFMT_TYPE_V16_SNORM,
- [PIPE_FORMAT_R16G16B16A16_SNORM] = NV30_3D_VTXFMT_TYPE_V16_SNORM,
- [PIPE_FORMAT_R16_SSCALED] = NV30_3D_VTXFMT_TYPE_V16_SSCALED,
- [PIPE_FORMAT_R16G16_SSCALED] = NV30_3D_VTXFMT_TYPE_V16_SSCALED,
- [PIPE_FORMAT_R16G16B16_SSCALED] = NV30_3D_VTXFMT_TYPE_V16_SSCALED,
- [PIPE_FORMAT_R16G16B16A16_SSCALED] = NV30_3D_VTXFMT_TYPE_V16_SSCALED,
-};
-
-static void *
-nvfx_vtxelts_state_create(struct pipe_context *pipe,
- unsigned num_elements,
- const struct pipe_vertex_element *elements)
-{
- struct nvfx_vtxelt_state *cso = CALLOC_STRUCT(nvfx_vtxelt_state);
- struct translate_key transkey;
- unsigned per_vertex_size[16];
- unsigned vb_compacted_index[16];
-
- if(num_elements > 16)
- {
- _debug_printf("Error: application attempted to use %u vertex elements, but only 16 are supported: ignoring the rest\n", num_elements);
- num_elements = 16;
- }
-
- memset(per_vertex_size, 0, sizeof(per_vertex_size));
- memcpy(cso->pipe, elements, num_elements * sizeof(elements[0]));
- cso->num_elements = num_elements;
- cso->needs_translate = FALSE;
-
- transkey.nr_elements = 0;
- transkey.output_stride = 0;
-
- for(unsigned i = 0; i < num_elements; ++i)
- {
- const struct pipe_vertex_element* ve = &elements[i];
- if(!ve->instance_divisor)
- per_vertex_size[ve->vertex_buffer_index] += util_format_get_stride(ve->src_format, 1);
- }
-
- for(unsigned i = 0; i < 16; ++i)
- {
- if(per_vertex_size[i])
- {
- unsigned idx = cso->num_per_vertex_buffer_infos++;
- cso->per_vertex_buffer_info[idx].vertex_buffer_index = i;
- cso->per_vertex_buffer_info[idx].per_vertex_size = per_vertex_size[i];
- vb_compacted_index[i] = idx;
- }
- }
-
- for(unsigned i = 0; i < num_elements; ++i)
- {
- const struct pipe_vertex_element* ve = &elements[i];
- unsigned type = nvfx_vertex_formats[ve->src_format];
- unsigned ncomp = util_format_get_nr_components(ve->src_format);
-
- //if(ve->frequency != PIPE_ELEMENT_FREQUENCY_PER_VERTEX)
- if(ve->instance_divisor)
- {
- struct nvfx_low_frequency_element* lfve;
- cso->vtxfmt[i] = NV30_3D_VTXFMT_TYPE_V32_FLOAT;
-
- //if(ve->frequency == PIPE_ELEMENT_FREQUENCY_CONSTANT)
- if(0)
- lfve = &cso->constant[cso->num_constant++];
- else
- {
- lfve = &cso->per_instance[cso->num_per_instance++].base;
- ((struct nvfx_per_instance_element*)lfve)->instance_divisor = ve->instance_divisor;
- }
-
- lfve->idx = i;
- lfve->vertex_buffer_index = ve->vertex_buffer_index;
- lfve->src_offset = ve->src_offset;
- lfve->fetch_rgba_float = util_format_description(ve->src_format)->fetch_rgba_float;
- lfve->ncomp = ncomp;
- }
- else
- {
- unsigned idx;
-
- idx = cso->num_per_vertex++;
- cso->per_vertex[idx].idx = i;
- cso->per_vertex[idx].vertex_buffer_index = ve->vertex_buffer_index;
- cso->per_vertex[idx].src_offset = ve->src_offset;
-
- idx = transkey.nr_elements++;
- transkey.element[idx].input_format = ve->src_format;
- transkey.element[idx].input_buffer = vb_compacted_index[ve->vertex_buffer_index];
- transkey.element[idx].input_offset = ve->src_offset;
- transkey.element[idx].instance_divisor = 0;
- transkey.element[idx].type = TRANSLATE_ELEMENT_NORMAL;
- if(type)
- {
- transkey.element[idx].output_format = ve->src_format;
- cso->vtxfmt[i] = (ncomp << NV30_3D_VTXFMT_SIZE__SHIFT) | type;
- }
- else
- {
- unsigned float32[4] = {PIPE_FORMAT_R32_FLOAT, PIPE_FORMAT_R32G32_FLOAT, PIPE_FORMAT_R32G32B32_FLOAT, PIPE_FORMAT_R32G32B32A32_FLOAT};
- transkey.element[idx].output_format = float32[ncomp - 1];
- cso->needs_translate = TRUE;
- cso->vtxfmt[i] = (ncomp << NV30_3D_VTXFMT_SIZE__SHIFT) | NV30_3D_VTXFMT_TYPE_V32_FLOAT;
- }
- transkey.element[idx].output_offset = transkey.output_stride;
- transkey.output_stride += (util_format_get_stride(transkey.element[idx].output_format, 1) + 3) & ~3;
- }
- }
-
- cso->translate = translate_create(&transkey);
- cso->vertex_length = transkey.output_stride >> 2;
- cso->max_vertices_per_packet = 2047 / MAX2(cso->vertex_length, 1);
-
- return (void *)cso;
-}
-
-static void
-nvfx_vtxelts_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- FREE(hwcso);
-}
-
-static void
-nvfx_vtxelts_state_bind(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->vtxelt = hwcso;
- nvfx->use_vertex_buffers = -1;
- nvfx->draw_dirty |= NVFX_NEW_ARRAYS;
-}
-
-static void
-nvfx_set_vertex_buffers(struct pipe_context *pipe, unsigned count,
- const struct pipe_vertex_buffer *vb)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- util_copy_vertex_buffers(nvfx->vtxbuf,
- &nvfx->vtxbuf_nr,
- vb, count);
-
- nvfx->use_vertex_buffers = -1;
- nvfx->draw_dirty |= NVFX_NEW_ARRAYS;
-}
-
-static void
-nvfx_set_index_buffer(struct pipe_context *pipe,
- const struct pipe_index_buffer *ib)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- if(ib)
- {
- pipe_resource_reference(&nvfx->idxbuf.buffer, ib->buffer);
- nvfx->idxbuf.index_size = ib->index_size;
- nvfx->idxbuf.offset = ib->offset;
- }
- else
- {
- pipe_resource_reference(&nvfx->idxbuf.buffer, 0);
- nvfx->idxbuf.index_size = 0;
- nvfx->idxbuf.offset = 0;
- }
-
- nvfx->dirty |= NVFX_NEW_INDEX;
- nvfx->draw_dirty |= NVFX_NEW_INDEX;
-}
-
-void
-nvfx_init_vbo_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.set_vertex_buffers = nvfx_set_vertex_buffers;
- nvfx->pipe.set_index_buffer = nvfx_set_index_buffer;
-
- nvfx->pipe.create_vertex_elements_state = nvfx_vtxelts_state_create;
- nvfx->pipe.delete_vertex_elements_state = nvfx_vtxelts_state_delete;
- nvfx->pipe.bind_vertex_elements_state = nvfx_vtxelts_state_bind;
-
- nvfx->pipe.redefine_user_buffer = u_default_redefine_user_buffer;
-}
+++ /dev/null
-#include "pipe/p_context.h"
-#include "pipe/p_defines.h"
-#include "pipe/p_state.h"
-#include "util/u_linkage.h"
-#include "util/u_debug.h"
-
-#include "pipe/p_shader_tokens.h"
-#include "tgsi/tgsi_parse.h"
-#include "tgsi/tgsi_dump.h"
-#include "tgsi/tgsi_util.h"
-#include "tgsi/tgsi_ureg.h"
-
-#include "draw/draw_context.h"
-
-#include "nvfx_context.h"
-#include "nvfx_state.h"
-#include "nvfx_resource.h"
-
-/* TODO (at least...):
- * 1. Indexed consts + ARL
- * 3. NV_vp11, NV_vp2, NV_vp3 features
- * - extra arith opcodes
- * - branching
- * - texture sampling
- * - indexed attribs
- * - indexed results
- * 4. bugs
- */
-
-#include "nv30_vertprog.h"
-#include "nv40_vertprog.h"
-
-struct nvfx_loop_entry
-{
- unsigned brk_target;
- unsigned cont_target;
-};
-
-struct nvfx_vpc {
- struct nvfx_context* nvfx;
- struct pipe_shader_state pipe;
- struct nvfx_vertex_program *vp;
- struct tgsi_shader_info* info;
-
- struct nvfx_vertex_program_exec *vpi;
-
- unsigned r_temps;
- unsigned r_temps_discard;
- struct nvfx_reg r_result[PIPE_MAX_SHADER_OUTPUTS];
- struct nvfx_reg *r_address;
- struct nvfx_reg *r_temp;
- struct nvfx_reg *r_const;
- struct nvfx_reg r_0_1;
-
- struct nvfx_reg *imm;
- unsigned nr_imm;
-
- unsigned hpos_idx;
-
- struct util_dynarray label_relocs;
- struct util_dynarray loop_stack;
-};
-
-static struct nvfx_reg
-temp(struct nvfx_vpc *vpc)
-{
- int idx = ffs(~vpc->r_temps) - 1;
-
- if (idx < 0) {
- NOUVEAU_ERR("out of temps!!\n");
- assert(0);
- return nvfx_reg(NVFXSR_TEMP, 0);
- }
-
- vpc->r_temps |= (1 << idx);
- vpc->r_temps_discard |= (1 << idx);
- return nvfx_reg(NVFXSR_TEMP, idx);
-}
-
-static inline void
-release_temps(struct nvfx_vpc *vpc)
-{
- vpc->r_temps &= ~vpc->r_temps_discard;
- vpc->r_temps_discard = 0;
-}
-
-static struct nvfx_reg
-constant(struct nvfx_vpc *vpc, int pipe, float x, float y, float z, float w)
-{
- struct nvfx_vertex_program *vp = vpc->vp;
- struct nvfx_vertex_program_data *vpd;
- int idx;
-
- if (pipe >= 0) {
- for (idx = 0; idx < vp->nr_consts; idx++) {
- if (vp->consts[idx].index == pipe)
- return nvfx_reg(NVFXSR_CONST, idx);
- }
- }
-
- idx = vp->nr_consts++;
- vp->consts = realloc(vp->consts, sizeof(*vpd) * vp->nr_consts);
- vpd = &vp->consts[idx];
-
- vpd->index = pipe;
- vpd->value[0] = x;
- vpd->value[1] = y;
- vpd->value[2] = z;
- vpd->value[3] = w;
- return nvfx_reg(NVFXSR_CONST, idx);
-}
-
-#define arith(s,t,o,d,m,s0,s1,s2) \
- nvfx_insn((s), (NVFX_VP_INST_SLOT_##t << 7) | NVFX_VP_INST_##t##_OP_##o, -1, (d), (m), (s0), (s1), (s2))
-
-static void
-emit_src(struct nvfx_context* nvfx, struct nvfx_vpc *vpc, uint32_t *hw, int pos, struct nvfx_src src)
-{
- struct nvfx_vertex_program *vp = vpc->vp;
- uint32_t sr = 0;
- struct nvfx_relocation reloc;
-
- switch (src.reg.type) {
- case NVFXSR_TEMP:
- sr |= (NVFX_VP(SRC_REG_TYPE_TEMP) << NVFX_VP(SRC_REG_TYPE_SHIFT));
- sr |= (src.reg.index << NVFX_VP(SRC_TEMP_SRC_SHIFT));
- break;
- case NVFXSR_INPUT:
- sr |= (NVFX_VP(SRC_REG_TYPE_INPUT) <<
- NVFX_VP(SRC_REG_TYPE_SHIFT));
- vp->ir |= (1 << src.reg.index);
- hw[1] |= (src.reg.index << NVFX_VP(INST_INPUT_SRC_SHIFT));
- break;
- case NVFXSR_CONST:
- sr |= (NVFX_VP(SRC_REG_TYPE_CONST) <<
- NVFX_VP(SRC_REG_TYPE_SHIFT));
- reloc.location = vp->nr_insns - 1;
- reloc.target = src.reg.index;
- util_dynarray_append(&vp->const_relocs, struct nvfx_relocation, reloc);
- break;
- case NVFXSR_NONE:
- sr |= (NVFX_VP(SRC_REG_TYPE_INPUT) <<
- NVFX_VP(SRC_REG_TYPE_SHIFT));
- break;
- default:
- assert(0);
- }
-
- if (src.negate)
- sr |= NVFX_VP(SRC_NEGATE);
-
- if (src.abs)
- hw[0] |= (1 << (21 + pos));
-
- sr |= ((src.swz[0] << NVFX_VP(SRC_SWZ_X_SHIFT)) |
- (src.swz[1] << NVFX_VP(SRC_SWZ_Y_SHIFT)) |
- (src.swz[2] << NVFX_VP(SRC_SWZ_Z_SHIFT)) |
- (src.swz[3] << NVFX_VP(SRC_SWZ_W_SHIFT)));
-
- if(src.indirect) {
- if(src.reg.type == NVFXSR_CONST)
- hw[3] |= NVFX_VP(INST_INDEX_CONST);
- else if(src.reg.type == NVFXSR_INPUT)
- hw[0] |= NVFX_VP(INST_INDEX_INPUT);
- else
- assert(0);
- if(src.indirect_reg)
- hw[0] |= NVFX_VP(INST_ADDR_REG_SELECT_1);
- hw[0] |= src.indirect_swz << NVFX_VP(INST_ADDR_SWZ_SHIFT);
- }
-
- switch (pos) {
- case 0:
- hw[1] |= ((sr & NVFX_VP(SRC0_HIGH_MASK)) >>
- NVFX_VP(SRC0_HIGH_SHIFT)) << NVFX_VP(INST_SRC0H_SHIFT);
- hw[2] |= (sr & NVFX_VP(SRC0_LOW_MASK)) <<
- NVFX_VP(INST_SRC0L_SHIFT);
- break;
- case 1:
- hw[2] |= sr << NVFX_VP(INST_SRC1_SHIFT);
- break;
- case 2:
- hw[2] |= ((sr & NVFX_VP(SRC2_HIGH_MASK)) >>
- NVFX_VP(SRC2_HIGH_SHIFT)) << NVFX_VP(INST_SRC2H_SHIFT);
- hw[3] |= (sr & NVFX_VP(SRC2_LOW_MASK)) <<
- NVFX_VP(INST_SRC2L_SHIFT);
- break;
- default:
- assert(0);
- }
-}
-
-static void
-emit_dst(struct nvfx_context* nvfx, struct nvfx_vpc *vpc, uint32_t *hw, int slot, struct nvfx_reg dst)
-{
- struct nvfx_vertex_program *vp = vpc->vp;
-
- switch (dst.type) {
- case NVFXSR_NONE:
- if(!nvfx->is_nv4x)
- hw[0] |= NV30_VP_INST_DEST_TEMP_ID_MASK;
- else {
- hw[3] |= NV40_VP_INST_DEST_MASK;
- if (slot == 0)
- hw[0] |= NV40_VP_INST_VEC_DEST_TEMP_MASK;
- else
- hw[3] |= NV40_VP_INST_SCA_DEST_TEMP_MASK;
- }
- break;
- case NVFXSR_TEMP:
- if(!nvfx->is_nv4x)
- hw[0] |= (dst.index << NV30_VP_INST_DEST_TEMP_ID_SHIFT);
- else {
- hw[3] |= NV40_VP_INST_DEST_MASK;
- if (slot == 0)
- hw[0] |= (dst.index << NV40_VP_INST_VEC_DEST_TEMP_SHIFT);
- else
- hw[3] |= (dst.index << NV40_VP_INST_SCA_DEST_TEMP_SHIFT);
- }
- break;
- case NVFXSR_OUTPUT:
- /* TODO: this may be wrong because on nv30 COL0 and BFC0 are swapped */
- if(nvfx->is_nv4x) {
- switch (dst.index) {
- case NV30_VP_INST_DEST_CLP(0):
- dst.index = NVFX_VP(INST_DEST_FOGC);
- break;
- case NV30_VP_INST_DEST_CLP(1):
- dst.index = NVFX_VP(INST_DEST_FOGC);
- break;
- case NV30_VP_INST_DEST_CLP(2):
- dst.index = NVFX_VP(INST_DEST_FOGC);
- break;
- case NV30_VP_INST_DEST_CLP(3):
- dst.index = NVFX_VP(INST_DEST_PSZ);
- break;
- case NV30_VP_INST_DEST_CLP(4):
- dst.index = NVFX_VP(INST_DEST_PSZ);
- break;
- case NV30_VP_INST_DEST_CLP(5):
- dst.index = NVFX_VP(INST_DEST_PSZ);
- break;
- case NV40_VP_INST_DEST_COL0 : vp->or |= (1 << 0); break;
- case NV40_VP_INST_DEST_COL1 : vp->or |= (1 << 1); break;
- case NV40_VP_INST_DEST_BFC0 : vp->or |= (1 << 2); break;
- case NV40_VP_INST_DEST_BFC1 : vp->or |= (1 << 3); break;
- case NV40_VP_INST_DEST_FOGC: vp->or |= (1 << 4); break;
- case NV40_VP_INST_DEST_PSZ : vp->or |= (1 << 5); break;
- }
- }
-
- if(!nvfx->is_nv4x) {
- hw[3] |= (dst.index << NV30_VP_INST_DEST_SHIFT);
- hw[0] |= NV30_VP_INST_VEC_DEST_TEMP_MASK;
-
- /*XXX: no way this is entirely correct, someone needs to
- * figure out what exactly it is.
- */
- hw[3] |= 0x800;
- } else {
- hw[3] |= (dst.index << NV40_VP_INST_DEST_SHIFT);
- if (slot == 0) {
- hw[0] |= NV40_VP_INST_VEC_RESULT;
- hw[0] |= NV40_VP_INST_VEC_DEST_TEMP_MASK;
- } else {
- hw[3] |= NV40_VP_INST_SCA_RESULT;
- hw[3] |= NV40_VP_INST_SCA_DEST_TEMP_MASK;
- }
- }
- break;
- default:
- assert(0);
- }
-}
-
-static void
-nvfx_vp_emit(struct nvfx_vpc *vpc, struct nvfx_insn insn)
-{
- struct nvfx_context* nvfx = vpc->nvfx;
- struct nvfx_vertex_program *vp = vpc->vp;
- unsigned slot = insn.op >> 7;
- unsigned op = insn.op & 0x7f;
- uint32_t *hw;
-
- vp->insns = realloc(vp->insns, ++vp->nr_insns * sizeof(*vpc->vpi));
- vpc->vpi = &vp->insns[vp->nr_insns - 1];
- memset(vpc->vpi, 0, sizeof(*vpc->vpi));
-
- hw = vpc->vpi->data;
-
- hw[0] |= (insn.cc_test << NVFX_VP(INST_COND_SHIFT));
- hw[0] |= ((insn.cc_swz[0] << NVFX_VP(INST_COND_SWZ_X_SHIFT)) |
- (insn.cc_swz[1] << NVFX_VP(INST_COND_SWZ_Y_SHIFT)) |
- (insn.cc_swz[2] << NVFX_VP(INST_COND_SWZ_Z_SHIFT)) |
- (insn.cc_swz[3] << NVFX_VP(INST_COND_SWZ_W_SHIFT)));
- if(insn.cc_update)
- hw[0] |= NVFX_VP(INST_COND_UPDATE_ENABLE);
-
- if(insn.sat)
- {
- assert(nvfx->use_nv4x);
- if(nvfx->use_nv4x)
- hw[0] |= NV40_VP_INST_SATURATE;
- }
-
- if(!nvfx->is_nv4x) {
- if(slot == 0)
- hw[1] |= (op << NV30_VP_INST_VEC_OPCODE_SHIFT);
- else
- {
- hw[0] |= ((op >> 4) << NV30_VP_INST_SCA_OPCODEH_SHIFT);
- hw[1] |= ((op & 0xf) << NV30_VP_INST_SCA_OPCODEL_SHIFT);
- }
-// hw[3] |= NVFX_VP(INST_SCA_DEST_TEMP_MASK);
-// hw[3] |= (mask << NVFX_VP(INST_VEC_WRITEMASK_SHIFT));
-
- if (insn.dst.type == NVFXSR_OUTPUT) {
- if (slot)
- hw[3] |= (insn.mask << NV30_VP_INST_SDEST_WRITEMASK_SHIFT);
- else
- hw[3] |= (insn.mask << NV30_VP_INST_VDEST_WRITEMASK_SHIFT);
- } else {
- if (slot)
- hw[3] |= (insn.mask << NV30_VP_INST_STEMP_WRITEMASK_SHIFT);
- else
- hw[3] |= (insn.mask << NV30_VP_INST_VTEMP_WRITEMASK_SHIFT);
- }
- } else {
- if (slot == 0) {
- hw[1] |= (op << NV40_VP_INST_VEC_OPCODE_SHIFT);
- hw[3] |= NV40_VP_INST_SCA_DEST_TEMP_MASK;
- hw[3] |= (insn.mask << NV40_VP_INST_VEC_WRITEMASK_SHIFT);
- } else {
- hw[1] |= (op << NV40_VP_INST_SCA_OPCODE_SHIFT);
- hw[0] |= NV40_VP_INST_VEC_DEST_TEMP_MASK ;
- hw[3] |= (insn.mask << NV40_VP_INST_SCA_WRITEMASK_SHIFT);
- }
- }
-
- emit_dst(nvfx, vpc, hw, slot, insn.dst);
- emit_src(nvfx, vpc, hw, 0, insn.src[0]);
- emit_src(nvfx, vpc, hw, 1, insn.src[1]);
- emit_src(nvfx, vpc, hw, 2, insn.src[2]);
-
-// if(insn.src[0].indirect || op == NVFX_VP_INST_VEC_OP_ARL)
-// hw[3] |= NV40_VP_INST_SCA_RESULT;
-}
-
-static inline struct nvfx_src
-tgsi_src(struct nvfx_vpc *vpc, const struct tgsi_full_src_register *fsrc) {
- struct nvfx_src src;
-
- switch (fsrc->Register.File) {
- case TGSI_FILE_INPUT:
- src.reg = nvfx_reg(NVFXSR_INPUT, fsrc->Register.Index);
- break;
- case TGSI_FILE_CONSTANT:
- src.reg = vpc->r_const[fsrc->Register.Index];
- break;
- case TGSI_FILE_IMMEDIATE:
- src.reg = vpc->imm[fsrc->Register.Index];
- break;
- case TGSI_FILE_TEMPORARY:
- src.reg = vpc->r_temp[fsrc->Register.Index];
- break;
- default:
- NOUVEAU_ERR("bad src file\n");
- src.reg.index = 0;
- src.reg.type = -1;
- break;
- }
-
- src.abs = fsrc->Register.Absolute;
- src.negate = fsrc->Register.Negate;
- src.swz[0] = fsrc->Register.SwizzleX;
- src.swz[1] = fsrc->Register.SwizzleY;
- src.swz[2] = fsrc->Register.SwizzleZ;
- src.swz[3] = fsrc->Register.SwizzleW;
- src.indirect = 0;
- src.indirect_reg = 0;
- src.indirect_swz = 0;
-
- if(fsrc->Register.Indirect) {
- if(fsrc->Indirect.File == TGSI_FILE_ADDRESS &&
- (fsrc->Register.File == TGSI_FILE_CONSTANT || fsrc->Register.File == TGSI_FILE_INPUT))
- {
- src.indirect = 1;
- src.indirect_reg = fsrc->Indirect.Index;
- src.indirect_swz = fsrc->Indirect.SwizzleX;
- }
- else
- {
- src.reg.index = 0;
- src.reg.type = -1;
- }
- }
- return src;
-}
-
-static INLINE struct nvfx_reg
-tgsi_dst(struct nvfx_vpc *vpc, const struct tgsi_full_dst_register *fdst) {
- struct nvfx_reg dst;
-
- switch (fdst->Register.File) {
- case TGSI_FILE_NULL:
- dst = nvfx_reg(NVFXSR_NONE, 0);
- break;
- case TGSI_FILE_OUTPUT:
- dst = vpc->r_result[fdst->Register.Index];
- break;
- case TGSI_FILE_TEMPORARY:
- dst = vpc->r_temp[fdst->Register.Index];
- break;
- case TGSI_FILE_ADDRESS:
- dst = vpc->r_address[fdst->Register.Index];
- break;
- default:
- NOUVEAU_ERR("bad dst file %i\n", fdst->Register.File);
- dst.index = 0;
- dst.type = 0;
- break;
- }
-
- return dst;
-}
-
-static inline int
-tgsi_mask(uint tgsi)
-{
- int mask = 0;
-
- if (tgsi & TGSI_WRITEMASK_X) mask |= NVFX_VP_MASK_X;
- if (tgsi & TGSI_WRITEMASK_Y) mask |= NVFX_VP_MASK_Y;
- if (tgsi & TGSI_WRITEMASK_Z) mask |= NVFX_VP_MASK_Z;
- if (tgsi & TGSI_WRITEMASK_W) mask |= NVFX_VP_MASK_W;
- return mask;
-}
-
-static boolean
-nvfx_vertprog_parse_instruction(struct nvfx_context* nvfx, struct nvfx_vpc *vpc,
- unsigned idx, const struct tgsi_full_instruction *finst)
-{
- struct nvfx_src src[3], tmp;
- struct nvfx_reg dst;
- struct nvfx_reg final_dst;
- struct nvfx_src none = nvfx_src(nvfx_reg(NVFXSR_NONE, 0));
- struct nvfx_insn insn;
- struct nvfx_relocation reloc;
- struct nvfx_loop_entry loop;
- boolean sat = FALSE;
- int mask;
- int ai = -1, ci = -1, ii = -1;
- int i;
- unsigned sub_depth = 0;
-
- for (i = 0; i < finst->Instruction.NumSrcRegs; i++) {
- const struct tgsi_full_src_register *fsrc;
-
- fsrc = &finst->Src[i];
- if (fsrc->Register.File == TGSI_FILE_TEMPORARY) {
- src[i] = tgsi_src(vpc, fsrc);
- }
- }
-
- for (i = 0; i < finst->Instruction.NumSrcRegs; i++) {
- const struct tgsi_full_src_register *fsrc;
-
- fsrc = &finst->Src[i];
-
- switch (fsrc->Register.File) {
- case TGSI_FILE_INPUT:
- if (ai == -1 || ai == fsrc->Register.Index) {
- ai = fsrc->Register.Index;
- src[i] = tgsi_src(vpc, fsrc);
- } else {
- src[i] = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, VEC, MOV, src[i].reg, NVFX_VP_MASK_ALL, tgsi_src(vpc, fsrc), none, none));
- }
- break;
- case TGSI_FILE_CONSTANT:
- if ((ci == -1 && ii == -1) ||
- ci == fsrc->Register.Index) {
- ci = fsrc->Register.Index;
- src[i] = tgsi_src(vpc, fsrc);
- } else {
- src[i] = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, VEC, MOV, src[i].reg, NVFX_VP_MASK_ALL, tgsi_src(vpc, fsrc), none, none));
- }
- break;
- case TGSI_FILE_IMMEDIATE:
- if ((ci == -1 && ii == -1) ||
- ii == fsrc->Register.Index) {
- ii = fsrc->Register.Index;
- src[i] = tgsi_src(vpc, fsrc);
- } else {
- src[i] = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, VEC, MOV, src[i].reg, NVFX_VP_MASK_ALL, tgsi_src(vpc, fsrc), none, none));
- }
- break;
- case TGSI_FILE_TEMPORARY:
- /* handled above */
- break;
- default:
- NOUVEAU_ERR("bad src file\n");
- return FALSE;
- }
- }
-
- for (i = 0; i < finst->Instruction.NumSrcRegs; i++) {
- if(src[i].reg.type < 0)
- return FALSE;
- }
-
- if(finst->Dst[0].Register.File == TGSI_FILE_ADDRESS &&
- finst->Instruction.Opcode != TGSI_OPCODE_ARL)
- return FALSE;
-
- final_dst = dst = tgsi_dst(vpc, &finst->Dst[0]);
- mask = tgsi_mask(finst->Dst[0].Register.WriteMask);
- if(finst->Instruction.Saturate == TGSI_SAT_ZERO_ONE)
- {
- assert(finst->Instruction.Opcode != TGSI_OPCODE_ARL);
- if(nvfx->use_nv4x)
- sat = TRUE;
- else if(dst.type != NVFXSR_TEMP)
- dst = temp(vpc);
- }
-
- switch (finst->Instruction.Opcode) {
- case TGSI_OPCODE_ABS:
- nvfx_vp_emit(vpc, arith(sat, VEC, MOV, dst, mask, abs(src[0]), none, none));
- break;
- case TGSI_OPCODE_ADD:
- nvfx_vp_emit(vpc, arith(sat, VEC, ADD, dst, mask, src[0], none, src[1]));
- break;
- case TGSI_OPCODE_ARL:
- nvfx_vp_emit(vpc, arith(0, VEC, ARL, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_CMP:
- insn = arith(0, VEC, MOV, none.reg, mask, src[0], none, none);
- insn.cc_update = 1;
- nvfx_vp_emit(vpc, insn);
-
- insn = arith(sat, VEC, MOV, dst, mask, src[2], none, none);
- insn.cc_test = NVFX_COND_GE;
- nvfx_vp_emit(vpc, insn);
-
- insn = arith(sat, VEC, MOV, dst, mask, src[1], none, none);
- insn.cc_test = NVFX_COND_LT;
- nvfx_vp_emit(vpc, insn);
- break;
- case TGSI_OPCODE_COS:
- nvfx_vp_emit(vpc, arith(sat, SCA, COS, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_DP2:
- tmp = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, VEC, MUL, tmp.reg, NVFX_VP_MASK_X | NVFX_VP_MASK_Y, src[0], src[1], none));
- nvfx_vp_emit(vpc, arith(sat, VEC, ADD, dst, mask, swz(tmp, X, X, X, X), none, swz(tmp, Y, Y, Y, Y)));
- break;
- case TGSI_OPCODE_DP3:
- nvfx_vp_emit(vpc, arith(sat, VEC, DP3, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_DP4:
- nvfx_vp_emit(vpc, arith(sat, VEC, DP4, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_DPH:
- nvfx_vp_emit(vpc, arith(sat, VEC, DPH, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_DST:
- nvfx_vp_emit(vpc, arith(sat, VEC, DST, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_EX2:
- nvfx_vp_emit(vpc, arith(sat, SCA, EX2, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_EXP:
- nvfx_vp_emit(vpc, arith(sat, SCA, EXP, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_FLR:
- nvfx_vp_emit(vpc, arith(sat, VEC, FLR, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_FRC:
- nvfx_vp_emit(vpc, arith(sat, VEC, FRC, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_LG2:
- nvfx_vp_emit(vpc, arith(sat, SCA, LG2, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_LIT:
- nvfx_vp_emit(vpc, arith(sat, SCA, LIT, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_LOG:
- nvfx_vp_emit(vpc, arith(sat, SCA, LOG, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_LRP:
- tmp = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, VEC, MAD, tmp.reg, mask, neg(src[0]), src[2], src[2]));
- nvfx_vp_emit(vpc, arith(sat, VEC, MAD, dst, mask, src[0], src[1], tmp));
- break;
- case TGSI_OPCODE_MAD:
- nvfx_vp_emit(vpc, arith(sat, VEC, MAD, dst, mask, src[0], src[1], src[2]));
- break;
- case TGSI_OPCODE_MAX:
- nvfx_vp_emit(vpc, arith(sat, VEC, MAX, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_MIN:
- nvfx_vp_emit(vpc, arith(sat, VEC, MIN, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_MOV:
- nvfx_vp_emit(vpc, arith(sat, VEC, MOV, dst, mask, src[0], none, none));
- break;
- case TGSI_OPCODE_MUL:
- nvfx_vp_emit(vpc, arith(sat, VEC, MUL, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_NOP:
- break;
- case TGSI_OPCODE_POW:
- tmp = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, SCA, LG2, tmp.reg, NVFX_VP_MASK_X, none, none, swz(src[0], X, X, X, X)));
- nvfx_vp_emit(vpc, arith(0, VEC, MUL, tmp.reg, NVFX_VP_MASK_X, swz(tmp, X, X, X, X), swz(src[1], X, X, X, X), none));
- nvfx_vp_emit(vpc, arith(sat, SCA, EX2, dst, mask, none, none, swz(tmp, X, X, X, X)));
- break;
- case TGSI_OPCODE_RCP:
- nvfx_vp_emit(vpc, arith(sat, SCA, RCP, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_RSQ:
- nvfx_vp_emit(vpc, arith(sat, SCA, RSQ, dst, mask, none, none, abs(src[0])));
- break;
- case TGSI_OPCODE_SEQ:
- nvfx_vp_emit(vpc, arith(sat, VEC, SEQ, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SFL:
- nvfx_vp_emit(vpc, arith(sat, VEC, SFL, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SGE:
- nvfx_vp_emit(vpc, arith(sat, VEC, SGE, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SGT:
- nvfx_vp_emit(vpc, arith(sat, VEC, SGT, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SIN:
- nvfx_vp_emit(vpc, arith(sat, SCA, SIN, dst, mask, none, none, src[0]));
- break;
- case TGSI_OPCODE_SLE:
- nvfx_vp_emit(vpc, arith(sat, VEC, SLE, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SLT:
- nvfx_vp_emit(vpc, arith(sat, VEC, SLT, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SNE:
- nvfx_vp_emit(vpc, arith(sat, VEC, SNE, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SSG:
- nvfx_vp_emit(vpc, arith(sat, VEC, SSG, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_STR:
- nvfx_vp_emit(vpc, arith(sat, VEC, STR, dst, mask, src[0], src[1], none));
- break;
- case TGSI_OPCODE_SUB:
- nvfx_vp_emit(vpc, arith(sat, VEC, ADD, dst, mask, src[0], none, neg(src[1])));
- break;
- case TGSI_OPCODE_TRUNC:
- tmp = nvfx_src(temp(vpc));
- insn = arith(0, VEC, MOV, none.reg, mask, src[0], none, none);
- insn.cc_update = 1;
- nvfx_vp_emit(vpc, insn);
-
- nvfx_vp_emit(vpc, arith(0, VEC, FLR, tmp.reg, mask, abs(src[0]), none, none));
- nvfx_vp_emit(vpc, arith(sat, VEC, MOV, dst, mask, tmp, none, none));
-
- insn = arith(sat, VEC, MOV, dst, mask, neg(tmp), none, none);
- insn.cc_test = NVFX_COND_LT;
- nvfx_vp_emit(vpc, insn);
- break;
- case TGSI_OPCODE_XPD:
- tmp = nvfx_src(temp(vpc));
- nvfx_vp_emit(vpc, arith(0, VEC, MUL, tmp.reg, mask, swz(src[0], Z, X, Y, Y), swz(src[1], Y, Z, X, X), none));
- nvfx_vp_emit(vpc, arith(sat, VEC, MAD, dst, (mask & ~NVFX_VP_MASK_W), swz(src[0], Y, Z, X, X), swz(src[1], Z, X, Y, Y), neg(tmp)));
- break;
-
- case TGSI_OPCODE_IF:
- insn = arith(0, VEC, MOV, none.reg, NVFX_VP_MASK_X, src[0], none, none);
- insn.cc_update = 1;
- nvfx_vp_emit(vpc, insn);
-
- reloc.location = vpc->vp->nr_insns;
- reloc.target = finst->Label.Label + 1;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
-
- insn = arith(0, SCA, BRA, none.reg, 0, none, none, none);
- insn.cc_test = NVFX_COND_EQ;
- insn.cc_swz[0] = insn.cc_swz[1] = insn.cc_swz[2] = insn.cc_swz[3] = 0;
- nvfx_vp_emit(vpc, insn);
- break;
-
- case TGSI_OPCODE_ELSE:
- case TGSI_OPCODE_BRA:
- case TGSI_OPCODE_CAL:
- reloc.location = vpc->vp->nr_insns;
- reloc.target = finst->Label.Label;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
-
- if(finst->Instruction.Opcode == TGSI_OPCODE_CAL)
- insn = arith(0, SCA, CAL, none.reg, 0, none, none, none);
- else
- insn = arith(0, SCA, BRA, none.reg, 0, none, none, none);
- nvfx_vp_emit(vpc, insn);
- break;
-
- case TGSI_OPCODE_RET:
- if(sub_depth || !nvfx->use_vp_clipping) {
- tmp = none;
- tmp.swz[0] = tmp.swz[1] = tmp.swz[2] = tmp.swz[3] = 0;
- nvfx_vp_emit(vpc, arith(0, SCA, RET, none.reg, 0, none, none, tmp));
- } else {
- reloc.location = vpc->vp->nr_insns;
- reloc.target = vpc->info->num_instructions;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
- nvfx_vp_emit(vpc, arith(0, SCA, BRA, none.reg, 0, none, none, none));
- }
- break;
-
- case TGSI_OPCODE_BGNSUB:
- ++sub_depth;
- break;
- case TGSI_OPCODE_ENDSUB:
- --sub_depth;
- break;
- case TGSI_OPCODE_ENDIF:
- /* nothing to do here */
- break;
-
- case TGSI_OPCODE_BGNLOOP:
- loop.cont_target = idx;
- loop.brk_target = finst->Label.Label + 1;
- util_dynarray_append(&vpc->loop_stack, struct nvfx_loop_entry, loop);
- break;
-
- case TGSI_OPCODE_ENDLOOP:
- loop = util_dynarray_pop(&vpc->loop_stack, struct nvfx_loop_entry);
-
- reloc.location = vpc->vp->nr_insns;
- reloc.target = loop.cont_target;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
-
- nvfx_vp_emit(vpc, arith(0, SCA, BRA, none.reg, 0, none, none, none));
- break;
-
- case TGSI_OPCODE_CONT:
- loop = util_dynarray_top(&vpc->loop_stack, struct nvfx_loop_entry);
-
- reloc.location = vpc->vp->nr_insns;
- reloc.target = loop.cont_target;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
-
- nvfx_vp_emit(vpc, arith(0, SCA, BRA, none.reg, 0, none, none, none));
- break;
-
- case TGSI_OPCODE_BRK:
- loop = util_dynarray_top(&vpc->loop_stack, struct nvfx_loop_entry);
-
- reloc.location = vpc->vp->nr_insns;
- reloc.target = loop.brk_target;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
-
- nvfx_vp_emit(vpc, arith(0, SCA, BRA, none.reg, 0, none, none, none));
- break;
-
- case TGSI_OPCODE_END:
- assert(!sub_depth);
- if(nvfx->use_vp_clipping) {
- if(idx != (vpc->info->num_instructions - 1)) {
- reloc.location = vpc->vp->nr_insns;
- reloc.target = vpc->info->num_instructions;
- util_dynarray_append(&vpc->label_relocs, struct nvfx_relocation, reloc);
- nvfx_vp_emit(vpc, arith(0, SCA, BRA, none.reg, 0, none, none, none));
- }
- } else {
- if(vpc->vp->nr_insns)
- vpc->vp->insns[vpc->vp->nr_insns - 1].data[3] |= NVFX_VP_INST_LAST;
- nvfx_vp_emit(vpc, arith(0, VEC, NOP, none.reg, 0, none, none, none));
- vpc->vp->insns[vpc->vp->nr_insns - 1].data[3] |= NVFX_VP_INST_LAST;
- }
- break;
-
- default:
- NOUVEAU_ERR("invalid opcode %d\n", finst->Instruction.Opcode);
- return FALSE;
- }
-
- if(finst->Instruction.Saturate == TGSI_SAT_ZERO_ONE && !nvfx->use_nv4x)
- {
- if(!vpc->r_0_1.type)
- vpc->r_0_1 = constant(vpc, -1, 0, 1, 0, 0);
- nvfx_vp_emit(vpc, arith(0, VEC, MAX, dst, mask, nvfx_src(dst), swz(nvfx_src(vpc->r_0_1), X, X, X, X), none));
- nvfx_vp_emit(vpc, arith(0, VEC, MIN, final_dst, mask, nvfx_src(dst), swz(nvfx_src(vpc->r_0_1), Y, Y, Y, Y), none));
- }
-
- release_temps(vpc);
- return TRUE;
-}
-
-static boolean
-nvfx_vertprog_parse_decl_output(struct nvfx_context* nvfx, struct nvfx_vpc *vpc,
- const struct tgsi_full_declaration *fdec)
-{
- unsigned idx = fdec->Range.First;
- int hw;
-
- switch (fdec->Semantic.Name) {
- case TGSI_SEMANTIC_POSITION:
- hw = NVFX_VP(INST_DEST_POS);
- vpc->hpos_idx = idx;
- break;
- case TGSI_SEMANTIC_COLOR:
- if (fdec->Semantic.Index == 0) {
- hw = NVFX_VP(INST_DEST_COL0);
- } else
- if (fdec->Semantic.Index == 1) {
- hw = NVFX_VP(INST_DEST_COL1);
- } else {
- NOUVEAU_ERR("bad colour semantic index\n");
- return FALSE;
- }
- break;
- case TGSI_SEMANTIC_BCOLOR:
- if (fdec->Semantic.Index == 0) {
- hw = NVFX_VP(INST_DEST_BFC0);
- } else
- if (fdec->Semantic.Index == 1) {
- hw = NVFX_VP(INST_DEST_BFC1);
- } else {
- NOUVEAU_ERR("bad bcolour semantic index\n");
- return FALSE;
- }
- break;
- case TGSI_SEMANTIC_FOG:
- hw = NVFX_VP(INST_DEST_FOGC);
- break;
- case TGSI_SEMANTIC_PSIZE:
- hw = NVFX_VP(INST_DEST_PSZ);
- break;
- case TGSI_SEMANTIC_GENERIC:
- hw = (vpc->vp->generic_to_fp_input[fdec->Semantic.Index] & 0xf) - NVFX_FP_OP_INPUT_SRC_TC(0);
- if(hw <= 8)
- hw = NVFX_VP(INST_DEST_TC(hw));
- else if(hw == 9) /* TODO: this is correct, but how does this overlapping work exactly? */
- hw = NV40_VP_INST_DEST_PSZ;
- else
- assert(0);
- break;
- case TGSI_SEMANTIC_EDGEFLAG:
- /* not really an error just a fallback */
- NOUVEAU_ERR("cannot handle edgeflag output\n");
- return FALSE;
- default:
- NOUVEAU_ERR("bad output semantic\n");
- return FALSE;
- }
-
- vpc->r_result[idx] = nvfx_reg(NVFXSR_OUTPUT, hw);
- return TRUE;
-}
-
-static boolean
-nvfx_vertprog_prepare(struct nvfx_context* nvfx, struct nvfx_vpc *vpc)
-{
- struct tgsi_parse_context p;
- int high_const = -1, high_temp = -1, high_addr = -1, nr_imm = 0, i;
- struct util_semantic_set set;
- unsigned char sem_layout[10];
- unsigned num_outputs;
- unsigned num_texcoords = nvfx->is_nv4x ? 10 : 8;
-
- num_outputs = util_semantic_set_from_program_file(&set, vpc->pipe.tokens, TGSI_FILE_OUTPUT);
-
- if(num_outputs > num_texcoords) {
- NOUVEAU_ERR("too many vertex program outputs: %i\n", num_outputs);
- return FALSE;
- }
- util_semantic_layout_from_set(sem_layout, &set, num_texcoords, num_texcoords);
-
- /* hope 0xf is (0, 0, 0, 1) initialized; otherwise, we are _probably_ not required to do this */
- memset(vpc->vp->generic_to_fp_input, 0x0f, sizeof(vpc->vp->generic_to_fp_input));
- for(int i = 0; i < num_texcoords; ++i) {
- if(sem_layout[i] == 0xff)
- continue;
- //printf("vp: GENERIC[%i] to fpreg %i\n", sem_layout[i], NVFX_FP_OP_INPUT_SRC_TC(0) + i);
- vpc->vp->generic_to_fp_input[sem_layout[i]] = 0xf0 | NVFX_FP_OP_INPUT_SRC_TC(i);
- }
-
- vpc->vp->sprite_fp_input = -1;
- for(int i = 0; i < num_texcoords; ++i)
- {
- if(sem_layout[i] == 0xff)
- {
- vpc->vp->sprite_fp_input = NVFX_FP_OP_INPUT_SRC_TC(i);
- break;
- }
- }
-
- tgsi_parse_init(&p, vpc->pipe.tokens);
- while (!tgsi_parse_end_of_tokens(&p)) {
- const union tgsi_full_token *tok = &p.FullToken;
-
- tgsi_parse_token(&p);
- switch(tok->Token.Type) {
- case TGSI_TOKEN_TYPE_IMMEDIATE:
- nr_imm++;
- break;
- case TGSI_TOKEN_TYPE_DECLARATION:
- {
- const struct tgsi_full_declaration *fdec;
-
- fdec = &p.FullToken.FullDeclaration;
- switch (fdec->Declaration.File) {
- case TGSI_FILE_TEMPORARY:
- if (fdec->Range.Last > high_temp) {
- high_temp =
- fdec->Range.Last;
- }
- break;
- case TGSI_FILE_ADDRESS:
- if (fdec->Range.Last > high_addr) {
- high_addr =
- fdec->Range.Last;
- }
- break;
- case TGSI_FILE_CONSTANT:
- if (fdec->Range.Last > high_const) {
- high_const =
- fdec->Range.Last;
- }
- break;
- case TGSI_FILE_OUTPUT:
- if (!nvfx_vertprog_parse_decl_output(nvfx, vpc, fdec))
- return FALSE;
- break;
- default:
- break;
- }
- }
- break;
- default:
- break;
- }
- }
- tgsi_parse_free(&p);
-
- if (nr_imm) {
- vpc->imm = CALLOC(nr_imm, sizeof(struct nvfx_reg));
- assert(vpc->imm);
- }
-
- if (++high_temp) {
- vpc->r_temp = CALLOC(high_temp, sizeof(struct nvfx_reg));
- for (i = 0; i < high_temp; i++)
- vpc->r_temp[i] = temp(vpc);
- }
-
- if (++high_addr) {
- vpc->r_address = CALLOC(high_addr, sizeof(struct nvfx_reg));
- for (i = 0; i < high_addr; i++)
- vpc->r_address[i] = nvfx_reg(NVFXSR_TEMP, i);
- }
-
- if(++high_const) {
- vpc->r_const = CALLOC(high_const, sizeof(struct nvfx_reg));
- for (i = 0; i < high_const; i++)
- vpc->r_const[i] = constant(vpc, i, 0, 0, 0, 0);
- }
-
- vpc->r_temps_discard = 0;
- return TRUE;
-}
-
-DEBUG_GET_ONCE_BOOL_OPTION(nvfx_dump_vp, "NVFX_DUMP_VP", FALSE)
-
-static struct nvfx_vertex_program*
-nvfx_vertprog_translate(struct nvfx_context *nvfx, const struct pipe_shader_state* vps, struct tgsi_shader_info* info)
-{
- struct tgsi_parse_context parse;
- struct nvfx_vertex_program* vp = NULL;
- struct nvfx_vpc *vpc = NULL;
- struct nvfx_src none = nvfx_src(nvfx_reg(NVFXSR_NONE, 0));
- struct util_dynarray insns;
- int i;
-
- tgsi_parse_init(&parse, vps->tokens);
-
- vp = CALLOC_STRUCT(nvfx_vertex_program);
- if(!vp)
- goto out_err;
-
- vpc = CALLOC_STRUCT(nvfx_vpc);
- if (!vpc)
- goto out_err;
-
- vpc->nvfx = nvfx;
- vpc->vp = vp;
- vpc->pipe = *vps;
- vpc->info = info;
-
- {
- // TODO: use a 64-bit atomic here!
- static unsigned long long id = 0;
- vp->id = ++id;
- }
-
- /* reserve space for ucps */
- if(nvfx->use_vp_clipping)
- {
- for(i = 0; i < 6; ++i)
- constant(vpc, -1, 0, 0, 0, 0);
- }
-
- if (!nvfx_vertprog_prepare(nvfx, vpc)) {
- FREE(vpc);
- return NULL;
- }
-
- /* Redirect post-transform vertex position to a temp if user clip
- * planes are enabled. We need to append code to the vtxprog
- * to handle clip planes later.
- */
- /* TODO: maybe support patching this depending on whether there are ucps: not sure if it is really matters much */
- if (nvfx->use_vp_clipping) {
- vpc->r_result[vpc->hpos_idx] = temp(vpc);
- vpc->r_temps_discard = 0;
- }
-
- util_dynarray_init(&insns);
- while (!tgsi_parse_end_of_tokens(&parse)) {
- tgsi_parse_token(&parse);
-
- switch (parse.FullToken.Token.Type) {
- case TGSI_TOKEN_TYPE_IMMEDIATE:
- {
- const struct tgsi_full_immediate *imm;
-
- imm = &parse.FullToken.FullImmediate;
- assert(imm->Immediate.DataType == TGSI_IMM_FLOAT32);
- assert(imm->Immediate.NrTokens == 4 + 1);
- vpc->imm[vpc->nr_imm++] =
- constant(vpc, -1,
- imm->u[0].Float,
- imm->u[1].Float,
- imm->u[2].Float,
- imm->u[3].Float);
- }
- break;
- case TGSI_TOKEN_TYPE_INSTRUCTION:
- {
- const struct tgsi_full_instruction *finst;
- unsigned idx = insns.size >> 2;
- util_dynarray_append(&insns, unsigned, vp->nr_insns);
- finst = &parse.FullToken.FullInstruction;
- if (!nvfx_vertprog_parse_instruction(nvfx, vpc, idx, finst))
- goto out_err;
- }
- break;
- default:
- break;
- }
- }
-
- util_dynarray_append(&insns, unsigned, vp->nr_insns);
-
- for(unsigned i = 0; i < vpc->label_relocs.size; i += sizeof(struct nvfx_relocation))
- {
- struct nvfx_relocation* label_reloc = (struct nvfx_relocation*)((char*)vpc->label_relocs.data + i);
- struct nvfx_relocation hw_reloc;
-
- hw_reloc.location = label_reloc->location;
- hw_reloc.target = ((unsigned*)insns.data)[label_reloc->target];
-
- //debug_printf("hw %u -> tgsi %u = hw %u\n", hw_reloc.location, label_reloc->target, hw_reloc.target);
-
- util_dynarray_append(&vp->branch_relocs, struct nvfx_relocation, hw_reloc);
- }
- util_dynarray_fini(&insns);
- util_dynarray_trim(&vp->branch_relocs);
-
- /* XXX: what if we add a RET before?! make sure we jump here...*/
-
- /* Write out HPOS if it was redirected to a temp earlier */
- if (vpc->r_result[vpc->hpos_idx].type != NVFXSR_OUTPUT) {
- struct nvfx_reg hpos = nvfx_reg(NVFXSR_OUTPUT,
- NVFX_VP(INST_DEST_POS));
- struct nvfx_src htmp = nvfx_src(vpc->r_result[vpc->hpos_idx]);
-
- nvfx_vp_emit(vpc, arith(0, VEC, MOV, hpos, NVFX_VP_MASK_ALL, htmp, none, none));
- }
-
- /* Insert code to handle user clip planes */
- if(nvfx->use_vp_clipping)
- {
- for (i = 0; i < 6; i++) {
- struct nvfx_reg cdst = nvfx_reg(NVFXSR_OUTPUT, NV30_VP_INST_DEST_CLP(i));
- struct nvfx_src ceqn = nvfx_src(nvfx_reg(NVFXSR_CONST, i));
- struct nvfx_src htmp = nvfx_src(vpc->r_result[vpc->hpos_idx]);
- unsigned mask;
-
- if(nvfx->is_nv4x)
- {
- switch (i) {
- case 0: case 3: mask = NVFX_VP_MASK_Y; break;
- case 1: case 4: mask = NVFX_VP_MASK_Z; break;
- case 2: case 5: mask = NVFX_VP_MASK_W; break;
- default:
- NOUVEAU_ERR("invalid clip dist #%d\n", i);
- goto out_err;
- }
- }
- else
- mask = NVFX_VP_MASK_X;
-
- nvfx_vp_emit(vpc, arith(0, VEC, DP4, cdst, mask, htmp, ceqn, none));
- }
- }
-
- if(debug_get_option_nvfx_dump_vp())
- {
- debug_printf("\n");
- tgsi_dump(vpc->pipe.tokens, 0);
-
- debug_printf("\n%s vertex program:\n", nvfx->is_nv4x ? "nv4x" : "nv3x");
- for (i = 0; i < vp->nr_insns; i++)
- debug_printf("%3u: %08x %08x %08x %08x\n", i, vp->insns[i].data[0], vp->insns[i].data[1], vp->insns[i].data[2], vp->insns[i].data[3]);
- debug_printf("\n");
- }
-
- vp->clip_nr = -1;
- vp->exec_start = -1;
-
-out:
- tgsi_parse_free(&parse);
- if(vpc) {
- util_dynarray_fini(&vpc->label_relocs);
- util_dynarray_fini(&vpc->loop_stack);
- FREE(vpc->r_temp);
- FREE(vpc->r_address);
- FREE(vpc->r_const);
- FREE(vpc->imm);
- FREE(vpc);
- }
- return vp;
-
-out_err:
- FREE(vp);
- vp = NULL;
- goto out;
-}
-
-static struct nvfx_vertex_program*
-nvfx_vertprog_translate_draw_vp(struct nvfx_context *nvfx, struct nvfx_pipe_vertex_program* pvp)
-{
- struct nvfx_vertex_program* vp = NULL;
- struct pipe_shader_state vps;
- struct tgsi_shader_info info;
- struct ureg_program *ureg = NULL;
- unsigned num_outputs = MIN2(pvp->info.num_outputs, 16);
-
- ureg = ureg_create( TGSI_PROCESSOR_VERTEX );
- if(ureg == NULL)
- return 0;
-
- for (unsigned i = 0; i < num_outputs; i++)
- ureg_MOV(ureg, ureg_DECL_output(ureg, pvp->info.output_semantic_name[i], pvp->info.output_semantic_index[i]), ureg_DECL_vs_input(ureg, i));
-
- ureg_END( ureg );
-
- vps.tokens = ureg_get_tokens(ureg, 0);
- tgsi_scan_shader(vps.tokens, &info);
- vp = nvfx_vertprog_translate(nvfx, &vps, &info);
- ureg_free_tokens(vps.tokens);
- ureg_destroy(ureg);
-
- return vp;
-}
-
-boolean
-nvfx_vertprog_validate(struct nvfx_context *nvfx)
-{
- struct nvfx_screen *screen = nvfx->screen;
- struct nouveau_channel *chan = screen->base.channel;
- struct nouveau_grobj *eng3d = screen->eng3d;
- struct nvfx_pipe_vertex_program *pvp = nvfx->vertprog;
- struct nvfx_vertex_program* vp;
- struct pipe_resource *constbuf;
- boolean upload_code = FALSE, upload_data = FALSE;
- int i;
-
- if (nvfx->render_mode == HW) {
- nvfx->fallback_swtnl &= ~NVFX_NEW_VERTPROG;
- vp = pvp->vp;
-
- if(!vp) {
- vp = nvfx_vertprog_translate(nvfx, &pvp->pipe, &pvp->info);
- if(!vp)
- vp = NVFX_VP_FAILED;
- pvp->vp = vp;
- }
-
- if(vp == NVFX_VP_FAILED) {
- nvfx->fallback_swtnl |= NVFX_NEW_VERTPROG;
- return FALSE;
- }
-
- constbuf = nvfx->constbuf[PIPE_SHADER_VERTEX];
- } else {
- vp = pvp->draw_vp;
- if(!vp)
- {
- pvp->draw_vp = vp = nvfx_vertprog_translate_draw_vp(nvfx, pvp);
- if(!vp) {
- _debug_printf("Error: unable to create a swtnl passthrough vertex shader: aborting.");
- abort();
- }
- }
- constbuf = NULL;
- }
-
- nvfx->hw_vertprog = vp;
-
- /* Allocate hw vtxprog exec slots */
- if (!vp->exec) {
- struct nouveau_resource *heap = nvfx->screen->vp_exec_heap;
- uint vplen = vp->nr_insns;
-
- if (nouveau_resource_alloc(heap, vplen, vp, &vp->exec)) {
- while (heap->next && heap->size < vplen) {
- struct nvfx_vertex_program *evict;
-
- evict = heap->next->priv;
- nouveau_resource_free(&evict->exec);
- }
-
- if (nouveau_resource_alloc(heap, vplen, vp, &vp->exec))
- {
- debug_printf("Vertex shader too long: %u instructions\n", vplen);
- nvfx->fallback_swtnl |= NVFX_NEW_VERTPROG;
- return FALSE;
- }
- }
-
- upload_code = TRUE;
- }
-
- /* Allocate hw vtxprog const slots */
- if (vp->nr_consts && !vp->data) {
- struct nouveau_resource *heap = nvfx->screen->vp_data_heap;
-
- if (nouveau_resource_alloc(heap, vp->nr_consts, vp, &vp->data)) {
- while (heap->next && heap->size < vp->nr_consts) {
- struct nvfx_vertex_program *evict;
-
- evict = heap->next->priv;
- nouveau_resource_free(&evict->data);
- }
-
- if (nouveau_resource_alloc(heap, vp->nr_consts, vp, &vp->data))
- {
- debug_printf("Vertex shader uses too many constants: %u constants\n", vp->nr_consts);
- nvfx->fallback_swtnl |= NVFX_NEW_VERTPROG;
- return FALSE;
- }
- }
-
- //printf("start at %u nc %u\n", vp->data->start, vp->nr_consts);
-
- /*XXX: handle this some day */
- assert(vp->data->start >= vp->data_start_min);
-
- upload_data = TRUE;
- if (vp->data_start != vp->data->start)
- upload_code = TRUE;
- }
-
- /* If exec or data segments moved we need to patch the program to
- * fixup offsets and register IDs.
- */
- if (vp->exec_start != vp->exec->start) {
- //printf("vp_relocs %u -> %u\n", vp->exec_start, vp->exec->start);
- for(unsigned i = 0; i < vp->branch_relocs.size; i += sizeof(struct nvfx_relocation))
- {
- struct nvfx_relocation* reloc = (struct nvfx_relocation*)((char*)vp->branch_relocs.data + i);
- uint32_t* hw = vp->insns[reloc->location].data;
- unsigned target = vp->exec->start + reloc->target;
-
- //debug_printf("vp_reloc hw %u -> hw %u\n", reloc->location, target);
-
- if(!nvfx->is_nv4x)
- {
- hw[2] &=~ NV30_VP_INST_IADDR_MASK;
- hw[2] |= (target & 0x1ff) << NV30_VP_INST_IADDR_SHIFT;
- }
- else
- {
- hw[3] &=~ NV40_VP_INST_IADDRL_MASK;
- hw[3] |= (target & 7) << NV40_VP_INST_IADDRL_SHIFT;
-
- hw[2] &=~ NV40_VP_INST_IADDRH_MASK;
- hw[2] |= ((target >> 3) & 0x3f) << NV40_VP_INST_IADDRH_SHIFT;
- }
- }
-
- vp->exec_start = vp->exec->start;
- }
-
- if (vp->data_start != vp->data->start) {
- for(unsigned i = 0; i < vp->const_relocs.size; i += sizeof(struct nvfx_relocation))
- {
- struct nvfx_relocation* reloc = (struct nvfx_relocation*)((char*)vp->const_relocs.data + i);
- struct nvfx_vertex_program_exec *vpi = &vp->insns[reloc->location];
-
- //printf("reloc %i to %i + %i\n", reloc->location, vp->data->start, reloc->target);
-
- vpi->data[1] &= ~NVFX_VP(INST_CONST_SRC_MASK);
- vpi->data[1] |=
- (reloc->target + vp->data->start) <<
- NVFX_VP(INST_CONST_SRC_SHIFT);
- }
-
- vp->data_start = vp->data->start;
- upload_code = TRUE;
- }
-
- /* Update + Upload constant values */
- if (vp->nr_consts) {
- float *map = NULL;
-
- if (constbuf)
- map = (float*)nvfx_buffer(constbuf)->data;
-
- /*
- * WAIT_RING(chan, 512 * 6);
- for (i = 0; i < 512; i++) {
- float v[4] = {0.1, 0,2, 0.3, 0.4};
- OUT_RING(chan, RING_3D(NV30_3D_VP_UPLOAD_CONST_ID, 5));
- OUT_RING(chan, i);
- OUT_RINGp(chan, (uint32_t *)v, 4);
- printf("frob %i\n", i);
- }
- */
-
- for (i = nvfx->use_vp_clipping ? 6 : 0; i < vp->nr_consts; i++) {
- struct nvfx_vertex_program_data *vpd = &vp->consts[i];
-
- if (vpd->index >= 0) {
- if (!upload_data &&
- !memcmp(vpd->value, &map[vpd->index * 4],
- 4 * sizeof(float)))
- continue;
- memcpy(vpd->value, &map[vpd->index * 4],
- 4 * sizeof(float));
- }
-
- //printf("upload into %i + %i: %f %f %f %f\n", vp->data->start, i, vpd->value[0], vpd->value[1], vpd->value[2], vpd->value[3]);
-
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_CONST_ID, 5);
- OUT_RING(chan, i + vp->data->start);
- OUT_RINGp(chan, (uint32_t *)vpd->value, 4);
- }
- }
-
- /* Upload vtxprog */
- if (upload_code) {
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_FROM_ID, 1);
- OUT_RING(chan, vp->exec->start);
- for (i = 0; i < vp->nr_insns; i++) {
- BEGIN_RING(chan, eng3d, NV30_3D_VP_UPLOAD_INST(0), 4);
- //printf("%08x %08x %08x %08x\n", vp->insns[i].data[0], vp->insns[i].data[1], vp->insns[i].data[2], vp->insns[i].data[3]);
- OUT_RINGp(chan, vp->insns[i].data, 4);
- }
- vp->clip_nr = -1;
- }
-
- if(nvfx->dirty & (NVFX_NEW_VERTPROG))
- {
- BEGIN_RING(chan, eng3d, NV30_3D_VP_START_FROM_ID, 1);
- OUT_RING(chan, vp->exec->start);
- if(nvfx->is_nv4x) {
- BEGIN_RING(chan, eng3d, NV40_3D_VP_ATTRIB_EN, 1);
- OUT_RING(chan, vp->ir);
- }
- }
-
- return TRUE;
-}
-
-void
-nvfx_vertprog_destroy(struct nvfx_context *nvfx, struct nvfx_vertex_program *vp)
-{
- if (vp->nr_insns)
- FREE(vp->insns);
-
- if (vp->nr_consts)
- FREE(vp->consts);
-
- nouveau_resource_free(&vp->exec);
- nouveau_resource_free(&vp->data);
-
- util_dynarray_fini(&vp->branch_relocs);
- util_dynarray_fini(&vp->const_relocs);
- FREE(vp);
-}
-
-static void *
-nvfx_vp_state_create(struct pipe_context *pipe, const struct pipe_shader_state *cso)
-{
- struct nvfx_pipe_vertex_program *pvp;
-
- pvp = CALLOC(1, sizeof(struct nvfx_pipe_vertex_program));
- pvp->pipe.tokens = tgsi_dup_tokens(cso->tokens);
- tgsi_scan_shader(pvp->pipe.tokens, &pvp->info);
- pvp->draw_elements = MAX2(1, MIN2(pvp->info.num_outputs, 16));
- pvp->draw_no_elements = pvp->info.num_outputs == 0;
-
- return (void *)pvp;
-}
-
-static void
-nvfx_vp_state_bind(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
-
- nvfx->vertprog = hwcso;
- nvfx->dirty |= NVFX_NEW_VERTPROG;
- nvfx->draw_dirty |= NVFX_NEW_VERTPROG;
-}
-
-static void
-nvfx_vp_state_delete(struct pipe_context *pipe, void *hwcso)
-{
- struct nvfx_context *nvfx = nvfx_context(pipe);
- struct nvfx_pipe_vertex_program *pvp = hwcso;
-
- if(pvp->draw_vs)
- draw_delete_vertex_shader(nvfx->draw, pvp->draw_vs);
- if(pvp->vp && pvp->vp != NVFX_VP_FAILED)
- nvfx_vertprog_destroy(nvfx, pvp->vp);
- if(pvp->draw_vp)
- nvfx_vertprog_destroy(nvfx, pvp->draw_vp);
- FREE((void*)pvp->pipe.tokens);
- FREE(pvp);
-}
-
-void
-nvfx_init_vertprog_functions(struct nvfx_context *nvfx)
-{
- nvfx->pipe.create_vs_state = nvfx_vp_state_create;
- nvfx->pipe.bind_vs_state = nvfx_vp_state_bind;
- nvfx->pipe.delete_vs_state = nvfx_vp_state_delete;
-}
$(TOP)/src/gallium/winsys/nouveau/drm/libnouveaudrm.a \
$(TOP)/src/gallium/drivers/trace/libtrace.a \
$(TOP)/src/gallium/drivers/rbug/librbug.a \
- $(TOP)/src/gallium/drivers/nvfx/libnvfx.a \
$(TOP)/src/gallium/drivers/nv50/libnv50.a \
$(TOP)/src/gallium/drivers/nvc0/libnvc0.a \
$(TOP)/src/gallium/drivers/nouveau/libnouveau.a
PIPE_DRIVERS = \
$(TOP)/src/gallium/winsys/nouveau/drm/libnouveaudrm.a \
- $(TOP)/src/gallium/drivers/nvfx/libnvfx.a \
$(TOP)/src/gallium/drivers/nv50/libnv50.a \
$(TOP)/src/gallium/drivers/nvc0/libnvc0.a \
$(TOP)/src/gallium/drivers/nouveau/libnouveau.a \
DRIVER_PIPES = \
$(TOP)/src/gallium/state_trackers/xorg/libxorgtracker.a \
$(TOP)/src/gallium/winsys/nouveau/drm/libnouveaudrm.a \
- $(TOP)/src/gallium/drivers/nvfx/libnvfx.a \
$(TOP)/src/gallium/drivers/nv50/libnv50.a \
$(TOP)/src/gallium/drivers/nvc0/libnvc0.a \
$(TOP)/src/gallium/drivers/nouveau/libnouveau.a \
PIPE_DRIVERS = \
$(TOP)/src/gallium/winsys/nouveau/drm/libnouveaudrm.a \
- $(TOP)/src/gallium/drivers/nvfx/libnvfx.a \
$(TOP)/src/gallium/drivers/nv50/libnv50.a \
$(TOP)/src/gallium/drivers/nvc0/libnvc0.a \
$(TOP)/src/gallium/drivers/nouveau/libnouveau.a \
return NULL;
switch (dev->chipset & 0xf0) {
+#if 0
case 0x30:
case 0x40:
case 0x60:
- init = nvfx_screen_create;
+ init = nv30_screen_create;
break;
+#endif
case 0x50:
case 0x80:
case 0x90: