--- /dev/null
+/*
+ * Copyright (C) 2016 Miklós Máté
+ * Copyright (C) 2020 Google LLC
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a
+ * copy of this software and associated documentation files (the "Software"),
+ * to deal in the Software without restriction, including without limitation
+ * the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ * and/or sell copies of the Software, and to permit persons to whom the
+ * Software is furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in
+ * all copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
+ * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
+ * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
+ * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ * OTHER DEALINGS IN THE SOFTWARE.
+ */
+
+#include "main/mtypes.h"
+#include "main/atifragshader.h"
+#include "main/errors.h"
+#include "program/prog_parameter.h"
+#include "program/prog_instruction.h"
+#include "program/prog_to_nir.h"
+
+#include "st_program.h"
+#include "st_atifs_to_nir.h"
+#include "compiler/nir/nir_builder.h"
+
+#define FOG_PARAMS_UNIFORM (MAX_NUM_FRAGMENT_CONSTANTS_ATI + 0)
+#define FOG_COLOR_UNIFORM (MAX_NUM_FRAGMENT_CONSTANTS_ATI + 1)
+
+/**
+ * Intermediate state used during shader translation.
+ */
+struct st_translate {
+ nir_builder *b;
+ struct ati_fragment_shader *atifs;
+ const struct st_fp_variant_key *key;
+
+ nir_ssa_def *temps[MAX_PROGRAM_TEMPS];
+
+ nir_variable *fragcolor;
+ nir_variable *constants;
+ nir_variable *samplers[MAX_TEXTURE_UNITS];
+
+ nir_ssa_def *inputs[VARYING_SLOT_MAX];
+
+ unsigned current_pass;
+
+ bool regs_written[MAX_NUM_PASSES_ATI][MAX_NUM_FRAGMENT_REGISTERS_ATI];
+
+ boolean error;
+};
+
+static nir_ssa_def *
+nir_channel_vec4(nir_builder *b, nir_ssa_def *src, unsigned channel)
+{
+ unsigned swizzle[4] = { channel, channel, channel, channel };
+ return nir_swizzle(b, src, swizzle, 4);
+}
+
+static nir_ssa_def *
+nir_imm_vec4_float(nir_builder *b, float f)
+{
+ return nir_channel_vec4(b, nir_imm_float(b, f), 0);
+}
+
+static nir_ssa_def *
+get_temp(struct st_translate *t, unsigned index)
+{
+ if (!t->temps[index])
+ t->temps[index] = nir_ssa_undef(t->b, 4, 32);
+ return t->temps[index];
+}
+
+static nir_ssa_def *
+apply_swizzle(struct st_translate *t,
+ struct nir_ssa_def *src, GLuint swizzle)
+{
+ /* From the ATI_fs spec:
+ *
+ * "Table 3.20 shows the <swizzle> modes:
+ *
+ * Coordinates Used for 1D or Coordinates Used for
+ * Swizzle 2D SampleMap and PassTexCoord 3D or cubemap SampleMap
+ * ------- ----------------------------- -----------------------
+ * SWIZZLE_STR_ATI (s, t, r, undefined) (s, t, r, undefined)
+ * SWIZZLE_STQ_ATI (s, t, q, undefined) (s, t, q, undefined)
+ * SWIZZLE_STR_DR_ATI (s/r, t/r, 1/r, undefined) (undefined)
+ * SWIZZLE_STQ_DQ_ATI (s/q, t/q, 1/q, undefined) (undefined)
+ */
+ if (swizzle == GL_SWIZZLE_STR_ATI) {
+ return src;
+ } else if (swizzle == GL_SWIZZLE_STQ_ATI) {
+ static unsigned xywz[4] = { 0, 1, 3, 2 };
+ return nir_swizzle(t->b, src, xywz, 4);
+ } else {
+ nir_ssa_def *rcp = nir_frcp(t->b, nir_channel(t->b, src,
+ swizzle == GL_SWIZZLE_STR_DR_ATI ? 2 : 3));
+
+ nir_ssa_def *st_mul = nir_fmul(t->b, nir_channels(t->b, src, 0x3), rcp);
+
+ return nir_vec4(t->b,
+ nir_channel(t->b, st_mul, 0),
+ nir_channel(t->b, st_mul, 1),
+ rcp,
+ rcp);
+ }
+}
+
+static nir_ssa_def *
+load_input(struct st_translate *t, gl_varying_slot slot)
+{
+ if (!t->inputs[slot]) {
+ nir_variable *var = nir_variable_create(t->b->shader, nir_var_shader_in,
+ slot == VARYING_SLOT_FOGC ?
+ glsl_float_type() : glsl_vec4_type(),
+ gl_varying_slot_name(slot));
+ var->data.location = slot;
+ var->data.interpolation = INTERP_MODE_NONE;
+
+ t->inputs[slot] = nir_load_var(t->b, var);
+ }
+
+ return t->inputs[slot];
+}
+
+static nir_ssa_def *
+atifs_load_uniform(struct st_translate *t, int index)
+{
+ nir_deref_instr *deref = nir_build_deref_array(t->b,
+ nir_build_deref_var(t->b, t->constants),
+ nir_imm_int(t->b, index));
+ return nir_load_deref(t->b, deref);
+}
+
+static struct nir_ssa_def *
+get_source(struct st_translate *t, GLenum src_type)
+{
+ if (src_type >= GL_REG_0_ATI && src_type <= GL_REG_5_ATI) {
+ if (t->regs_written[t->current_pass][src_type - GL_REG_0_ATI]) {
+ return get_temp(t, src_type - GL_REG_0_ATI);
+ } else {
+ return nir_imm_vec4_float(t->b, 0.0);
+ }
+ } else if (src_type >= GL_CON_0_ATI && src_type <= GL_CON_7_ATI) {
+ int index = src_type - GL_CON_0_ATI;
+ if (t->atifs->LocalConstDef & (1 << index)) {
+ return nir_imm_vec4(t->b,
+ t->atifs->Constants[index][0],
+ t->atifs->Constants[index][1],
+ t->atifs->Constants[index][2],
+ t->atifs->Constants[index][3]);
+ } else {
+ return atifs_load_uniform(t, index);
+ }
+ } else if (src_type == GL_ZERO) {
+ return nir_imm_vec4_float(t->b, 0.0);
+ } else if (src_type == GL_ONE) {
+ return nir_imm_vec4_float(t->b, 1.0);
+ } else if (src_type == GL_PRIMARY_COLOR_ARB) {
+ return load_input(t, VARYING_SLOT_COL0);
+ } else if (src_type == GL_SECONDARY_INTERPOLATOR_ATI) {
+ return load_input(t, VARYING_SLOT_COL1);
+ } else {
+ /* frontend prevents this */
+ unreachable("unknown source");
+ }
+}
+
+static nir_ssa_def *
+prepare_argument(struct st_translate *t, const struct atifs_instruction *inst,
+ const unsigned argId, bool alpha)
+{
+ if (argId >= inst->ArgCount[alpha]) {
+ _mesa_warning(0, "Using 0 for missing argument %d\n", argId);
+ return nir_imm_vec4_float(t->b, 0.0f);
+ }
+
+ const struct atifragshader_src_register *srcReg = &inst->SrcReg[alpha][argId];
+
+ nir_ssa_def *src = get_source(t, srcReg->Index);
+
+ switch (srcReg->argRep) {
+ case GL_NONE:
+ break;
+ case GL_RED:
+ src = nir_channel_vec4(t->b, src, 0);
+ break;
+ case GL_GREEN:
+ src = nir_channel_vec4(t->b, src, 1);
+ break;
+ case GL_BLUE:
+ src = nir_channel_vec4(t->b, src, 2);
+ break;
+ case GL_ALPHA:
+ src = nir_channel_vec4(t->b, src, 3);
+ break;
+ }
+
+ t->temps[MAX_NUM_FRAGMENT_REGISTERS_ATI + argId] = src;
+
+ if (srcReg->argMod & GL_COMP_BIT_ATI)
+ src = nir_fsub(t->b, nir_imm_vec4_float(t->b, 1.0), src);
+ if (srcReg->argMod & GL_BIAS_BIT_ATI)
+ src = nir_fadd(t->b, src, nir_imm_vec4_float(t->b, -0.5));
+ if (srcReg->argMod & GL_2X_BIT_ATI)
+ src = nir_fadd(t->b, src, src);
+ if (srcReg->argMod & GL_NEGATE_BIT_ATI)
+ src = nir_fneg(t->b, src);
+
+ return src;
+}
+
+static nir_ssa_def *
+emit_arith_inst(struct st_translate *t,
+ const struct atifs_instruction *inst,
+ bool alpha)
+{
+ nir_ssa_def *src[3] = {0};
+ for (int i = 0; i < inst->ArgCount[alpha]; i++)
+ src[i] = prepare_argument(t, inst, i, alpha);
+
+ switch (inst->Opcode[alpha]) {
+ case GL_MOV_ATI:
+ return src[0];
+
+ case GL_ADD_ATI:
+ return nir_fadd(t->b, src[0], src[1]);
+
+ case GL_SUB_ATI:
+ return nir_fsub(t->b, src[0], src[1]);
+
+ case GL_MUL_ATI:
+ return nir_fmul(t->b, src[0], src[1]);
+
+ case GL_MAD_ATI:
+ return nir_ffma(t->b, src[0], src[1], src[2]);
+
+ case GL_LERP_ATI:
+ return nir_flrp(t->b, src[2], src[1], src[0]);
+
+ case GL_CND_ATI:
+ return nir_bcsel(t->b,
+ nir_fge(t->b, nir_imm_vec4_float(t->b, 0.5), src[2]),
+ src[1],
+ src[0]);
+
+ case GL_CND0_ATI:
+ return nir_bcsel(t->b,
+ nir_fge(t->b, src[2], nir_imm_vec4_float(t->b, 0.0)),
+ src[0],
+ src[1]);
+
+ case GL_DOT2_ADD_ATI:
+ return nir_channel_vec4(t->b,
+ nir_fadd(t->b,
+ nir_fdot2(t->b, src[0], src[1]),
+ nir_channel(t->b, src[1], 2)),
+ 0);
+
+ case GL_DOT3_ATI:
+ return nir_channel_vec4(t->b, nir_fdot3(t->b,src[0], src[1]), 0);
+
+ case GL_DOT4_ATI:
+ return nir_channel_vec4(t->b, nir_fdot4(t->b,src[0], src[1]), 0);
+
+ default:
+ unreachable("Unknown ATI_fs opcode");
+ }
+}
+
+static nir_ssa_def *
+emit_dstmod(struct st_translate *t,
+ struct nir_ssa_def *dst, GLuint dstMod)
+{
+ switch (dstMod & ~GL_SATURATE_BIT_ATI) {
+ case GL_2X_BIT_ATI:
+ dst = nir_fmul_imm(t->b, dst, 2.0f);
+ break;
+ case GL_4X_BIT_ATI:
+ dst = nir_fmul_imm(t->b, dst, 4.0f);
+ break;
+ case GL_8X_BIT_ATI:
+ dst = nir_fmul_imm(t->b, dst, 8.0f);
+ break;
+ case GL_HALF_BIT_ATI:
+ dst = nir_fmul_imm(t->b, dst, 0.5f);
+ break;
+ case GL_QUARTER_BIT_ATI:
+ dst = nir_fmul_imm(t->b, dst, 0.25f);
+ break;
+ case GL_EIGHTH_BIT_ATI:
+ dst = nir_fmul_imm(t->b, dst, 0.125f);
+ break;
+ default:
+ break;
+ }
+
+ if (dstMod & GL_SATURATE_BIT_ATI)
+ dst = nir_fsat(t->b, dst);
+
+ return dst;
+}
+
+/**
+ * Compile one setup instruction to NIR instructions.
+ */
+static void
+compile_setupinst(struct st_translate *t,
+ const unsigned r,
+ const struct atifs_setupinst *texinst)
+{
+ if (!texinst->Opcode)
+ return;
+
+ GLuint pass_tex = texinst->src;
+
+ nir_ssa_def *coord;
+
+ if (pass_tex >= GL_TEXTURE0_ARB && pass_tex <= GL_TEXTURE7_ARB) {
+ unsigned attr = pass_tex - GL_TEXTURE0_ARB;
+
+ coord = load_input(t, VARYING_SLOT_TEX0 + attr);
+ } else if (pass_tex >= GL_REG_0_ATI && pass_tex <= GL_REG_5_ATI) {
+ unsigned reg = pass_tex - GL_REG_0_ATI;
+
+ /* the frontend already validated that REG is only allowed in second pass */
+ if (t->regs_written[0][reg]) {
+ coord = t->temps[reg];
+ } else {
+ coord = nir_imm_vec4_float(t->b, 0.0f);
+ }
+ } else {
+ coord = nir_ssa_undef(t->b, 4, 32);
+ }
+ coord = apply_swizzle(t, coord, texinst->swizzle);
+
+ if (texinst->Opcode == ATI_FRAGMENT_SHADER_SAMPLE_OP) {
+ nir_variable *tex_var = t->samplers[r];
+ if (!tex_var) {
+ bool is_array;
+ enum glsl_sampler_dim sampler_dim =
+ _mesa_texture_index_to_sampler_dim(t->key->texture_index[r], &is_array);
+ const struct glsl_type *sampler_type =
+ glsl_sampler_type(sampler_dim, false, false, GLSL_TYPE_FLOAT);
+
+ tex_var = nir_variable_create(t->b->shader, nir_var_uniform, sampler_type, "tex");
+ tex_var->data.binding = r;
+ tex_var->data.explicit_binding = true;
+ t->samplers[r] = tex_var;
+ }
+ nir_deref_instr *tex_deref = nir_build_deref_var(t->b, t->samplers[r]);
+
+ nir_tex_instr *tex = nir_tex_instr_create(t->b->shader, 3);
+ tex->op = nir_texop_tex;
+ tex->sampler_dim = glsl_get_sampler_dim(tex_var->type);
+ tex->dest_type = nir_type_float;
+ tex->coord_components =
+ glsl_get_sampler_dim_coordinate_components(tex->sampler_dim);
+
+ tex->src[0].src_type = nir_tex_src_texture_deref;
+ tex->src[0].src = nir_src_for_ssa(&tex_deref->dest.ssa);
+ tex->src[1].src_type = nir_tex_src_sampler_deref;
+ tex->src[1].src = nir_src_for_ssa(&tex_deref->dest.ssa);
+ tex->src[2].src_type = nir_tex_src_coord;
+ tex->src[2].src =
+ nir_src_for_ssa(nir_channels(t->b, coord,
+ (1 << tex->coord_components) - 1));
+
+ nir_ssa_dest_init(&tex->instr, &tex->dest, 4, 32, NULL);
+ nir_builder_instr_insert(t->b, &tex->instr);
+
+ t->temps[r] = &tex->dest.ssa;
+ } else if (texinst->Opcode == ATI_FRAGMENT_SHADER_PASS_OP) {
+ t->temps[r] = coord;
+ }
+
+ t->regs_written[t->current_pass][r] = true;
+}
+
+/**
+ * Compile one arithmetic operation COLOR&ALPHA pair into NIR instructions.
+ */
+static void
+compile_instruction(struct st_translate *t,
+ const struct atifs_instruction *inst)
+{
+ unsigned optype;
+
+ for (optype = 0; optype < 2; optype++) { /* color, alpha */
+ unsigned dstreg = inst->DstReg[optype].Index - GL_REG_0_ATI;
+
+ if (!inst->Opcode[optype])
+ continue;
+
+ /* Execute the op */
+ nir_ssa_def *result = emit_arith_inst(t, inst, optype);
+ result = emit_dstmod(t, result, inst->DstReg[optype].dstMod);
+
+ /* Do the writemask */
+ nir_const_value wrmask[4] = { 0 };
+ for (int i = 0; i < 4; i++) {
+ if (inst->DstReg[optype].dstMask & (1 << i))
+ wrmask[i].b = 1;
+ }
+
+ t->temps[dstreg] = nir_bcsel(t->b,
+ nir_build_imm(t->b, 4, 1, wrmask),
+ result,
+ get_temp(t, dstreg));
+ t->regs_written[t->current_pass][dstreg] = true;
+ }
+}
+
+
+/* Creates the uniform variable referencing the ATI_fragment_shader constants
+ * plus the optimized fog state.
+ */
+static void
+st_atifs_setup_uniforms(struct st_translate *t, struct gl_program *program)
+{
+ const struct glsl_type *type =
+ glsl_array_type(glsl_vec4_type(), program->Parameters->NumParameters, 0);
+ t->constants =
+ nir_variable_create(t->b->shader, nir_var_uniform, type,
+ "gl_ATI_fragment_shader_constants");
+}
+
+/**
+ * Called when a new variant is needed, we need to translate
+ * the ATI fragment shader to NIR
+ */
+nir_shader *
+st_translate_atifs_program(struct ati_fragment_shader *atifs,
+ const struct st_fp_variant_key *key,
+ struct gl_program *program,
+ const nir_shader_compiler_options *options)
+{
+ nir_builder b = nir_builder_init_simple_shader(MESA_SHADER_FRAGMENT, options, "ATI_fs");
+
+ struct st_translate translate = {
+ .atifs = atifs,
+ .b = &b,
+ .key = key,
+ };
+ struct st_translate *t = &translate;
+
+ /* Copy the shader_info from the gl_program */
+ t->b->shader->info = program->info;
+
+ nir_shader *s = t->b->shader;
+ s->info.name = ralloc_asprintf(s, "ATIFS%d", program->Id);
+
+ t->fragcolor = nir_variable_create(b.shader, nir_var_shader_out,
+ glsl_vec4_type(), "gl_FragColor");
+ t->fragcolor->data.location = FRAG_RESULT_COLOR;
+
+ st_atifs_setup_uniforms(t, program);
+
+ /* emit instructions */
+ for (unsigned pass = 0; pass < atifs->NumPasses; pass++) {
+ t->current_pass = pass;
+ for (unsigned r = 0; r < MAX_NUM_FRAGMENT_REGISTERS_ATI; r++) {
+ struct atifs_setupinst *texinst = &atifs->SetupInst[pass][r];
+ compile_setupinst(t, r, texinst);
+ }
+ for (unsigned i = 0; i < atifs->numArithInstr[pass]; i++) {
+ struct atifs_instruction *inst = &atifs->Instructions[pass][i];
+ compile_instruction(t, inst);
+ }
+ }
+
+ if (t->regs_written[atifs->NumPasses-1][0]) {
+ nir_ssa_def *color = t->temps[0];
+
+ if (key->fog) {
+ nir_ssa_def *fogc = load_input(t, VARYING_SLOT_FOGC);
+
+ nir_ssa_def *params = atifs_load_uniform(t, FOG_PARAMS_UNIFORM);
+
+ /* compute the 1 component fog factor f */
+ nir_ssa_def *f = NULL;
+ if (key->fog == FOG_LINEAR) {
+ f = nir_ffma(t->b, fogc,
+ nir_channel(t->b, params, 0),
+ nir_channel(t->b, params, 1));
+ } else if (key->fog == FOG_EXP) {
+ /* EXP formula: f = exp(-dens * z)
+ * with optimized parameters:
+ * f = MUL(fogcoord, oparams.z); f= EX2(-f)
+ */
+ f = nir_fmul(t->b, fogc, nir_channel(t->b, params, 2));
+ f = nir_fexp2(t->b, nir_fneg(t->b, f));
+ } else if (key->fog == FOG_EXP2) {
+ /* EXP2 formula: f = exp(-(dens * z)^2)
+ * with optimized parameters:
+ * f = MUL(fogcoord, oparams.w); f=MUL(f, f); f= EX2(-f)
+ */
+ f = nir_fmul(t->b, fogc, nir_channel(t->b, params, 3));
+ f = nir_fmul(t->b, f, f);
+ f = nir_fexp2(t->b, nir_fneg(t->b, f));
+ }
+ f = nir_fsat(t->b, f);
+
+ nir_ssa_def *fog_color = nir_flrp(t->b,
+ atifs_load_uniform(t, FOG_COLOR_UNIFORM),
+ color,
+ f);
+ color = nir_vec4(t->b,
+ nir_channel(t->b, fog_color, 0),
+ nir_channel(t->b, fog_color, 1),
+ nir_channel(t->b, fog_color, 2),
+ nir_channel(t->b, color, 3));
+ }
+
+ nir_store_var(t->b, t->fragcolor, color, 0xf);
+ }
+
+ return b.shader;
+}
+
+/**
+ * Called in ProgramStringNotify, we need to fill the metadata of the
+ * gl_program attached to the ati_fragment_shader
+ */
+void
+st_init_atifs_prog(struct gl_context *ctx, struct gl_program *prog)
+{
+ /* we know this is st_fragment_program, because of st_new_ati_fs() */
+ struct st_program *stfp = (struct st_program *) prog;
+ struct ati_fragment_shader *atifs = stfp->ati_fs;
+
+ unsigned pass, i, r, optype, arg;
+
+ static const gl_state_index16 fog_params_state[STATE_LENGTH] =
+ {STATE_INTERNAL, STATE_FOG_PARAMS_OPTIMIZED, 0, 0};
+ static const gl_state_index16 fog_color[STATE_LENGTH] =
+ {STATE_FOG_COLOR, 0, 0, 0};
+
+ prog->info.inputs_read = 0;
+ prog->info.outputs_written = BITFIELD64_BIT(FRAG_RESULT_COLOR);
+ prog->SamplersUsed = 0;
+ prog->Parameters = _mesa_new_parameter_list();
+
+ /* fill in inputs_read, SamplersUsed, TexturesUsed */
+ for (pass = 0; pass < atifs->NumPasses; pass++) {
+ for (r = 0; r < MAX_NUM_FRAGMENT_REGISTERS_ATI; r++) {
+ struct atifs_setupinst *texinst = &atifs->SetupInst[pass][r];
+ GLuint pass_tex = texinst->src;
+
+ if (texinst->Opcode == ATI_FRAGMENT_SHADER_SAMPLE_OP) {
+ /* mark which texcoords are used */
+ prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_TEX0 + pass_tex - GL_TEXTURE0_ARB);
+ /* by default there is 1:1 mapping between samplers and textures */
+ prog->SamplersUsed |= (1 << r);
+ /* the target is unknown here, it will be fixed in the draw call */
+ prog->TexturesUsed[r] = TEXTURE_2D_BIT;
+ } else if (texinst->Opcode == ATI_FRAGMENT_SHADER_PASS_OP) {
+ if (pass_tex >= GL_TEXTURE0_ARB && pass_tex <= GL_TEXTURE7_ARB) {
+ prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_TEX0 + pass_tex - GL_TEXTURE0_ARB);
+ }
+ }
+ }
+ }
+ for (pass = 0; pass < atifs->NumPasses; pass++) {
+ for (i = 0; i < atifs->numArithInstr[pass]; i++) {
+ struct atifs_instruction *inst = &atifs->Instructions[pass][i];
+
+ for (optype = 0; optype < 2; optype++) { /* color, alpha */
+ if (inst->Opcode[optype]) {
+ for (arg = 0; arg < inst->ArgCount[optype]; arg++) {
+ GLint index = inst->SrcReg[optype][arg].Index;
+ if (index == GL_PRIMARY_COLOR_EXT) {
+ prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_COL0);
+ } else if (index == GL_SECONDARY_INTERPOLATOR_ATI) {
+ /* note: ATI_fragment_shader.txt never specifies what
+ * GL_SECONDARY_INTERPOLATOR_ATI is, swrast uses
+ * VARYING_SLOT_COL1 for this input */
+ prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_COL1);
+ }
+ }
+ }
+ }
+ }
+ }
+ /* we may need fog */
+ prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_FOGC);
+
+ /* we always have the ATI_fs constants, and the fog params */
+ for (i = 0; i < MAX_NUM_FRAGMENT_CONSTANTS_ATI; i++) {
+ _mesa_add_parameter(prog->Parameters, PROGRAM_UNIFORM,
+ NULL, 4, GL_FLOAT, NULL, NULL, true);
+ }
+ ASSERTED uint32_t ref;
+ ref = _mesa_add_state_reference(prog->Parameters, fog_params_state);
+ assert(ref == FOG_PARAMS_UNIFORM);
+ ref = _mesa_add_state_reference(prog->Parameters, fog_color);
+ assert(ref == FOG_COLOR_UNIFORM);
+}
+++ /dev/null
-/*
- * Copyright (C) 2016 Miklós Máté
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in
- * all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
- * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
- * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
- * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
- * OTHER DEALINGS IN THE SOFTWARE.
- */
-
-#include "main/mtypes.h"
-#include "main/atifragshader.h"
-#include "main/errors.h"
-#include "program/prog_parameter.h"
-
-#include "tgsi/tgsi_ureg.h"
-#include "tgsi/tgsi_scan.h"
-#include "tgsi/tgsi_transform.h"
-
-#include "st_program.h"
-#include "st_atifs_to_tgsi.h"
-
-/**
- * Intermediate state used during shader translation.
- */
-struct st_translate {
- struct ureg_program *ureg;
- struct ati_fragment_shader *atifs;
-
- struct ureg_dst temps[MAX_PROGRAM_TEMPS];
- struct ureg_src *constants;
- struct ureg_dst outputs[PIPE_MAX_SHADER_OUTPUTS];
- struct ureg_src inputs[PIPE_MAX_SHADER_INPUTS];
- struct ureg_src samplers[PIPE_MAX_SAMPLERS];
-
- const ubyte *inputMapping;
- const ubyte *outputMapping;
-
- unsigned current_pass;
-
- bool regs_written[MAX_NUM_PASSES_ATI][MAX_NUM_FRAGMENT_REGISTERS_ATI];
-
- boolean error;
-};
-
-struct instruction_desc {
- unsigned TGSI_opcode;
- const char *name;
- unsigned char arg_count;
-};
-
-static const struct instruction_desc inst_desc[] = {
- {TGSI_OPCODE_MOV, "MOV", 1},
- {TGSI_OPCODE_NOP, "UND", 0}, /* unused */
- {TGSI_OPCODE_ADD, "ADD", 2},
- {TGSI_OPCODE_MUL, "MUL", 2},
- {TGSI_OPCODE_NOP, "SUB", 2},
- {TGSI_OPCODE_DP3, "DOT3", 2},
- {TGSI_OPCODE_DP4, "DOT4", 2},
- {TGSI_OPCODE_MAD, "MAD", 3},
- {TGSI_OPCODE_LRP, "LERP", 3},
- {TGSI_OPCODE_NOP, "CND", 3},
- {TGSI_OPCODE_NOP, "CND0", 3},
- {TGSI_OPCODE_NOP, "DOT2_ADD", 3}
-};
-
-static struct ureg_dst
-get_temp(struct st_translate *t, unsigned index)
-{
- if (ureg_dst_is_undef(t->temps[index]))
- t->temps[index] = ureg_DECL_temporary(t->ureg);
- return t->temps[index];
-}
-
-static struct ureg_src
-apply_swizzle(struct st_translate *t,
- struct ureg_src src, GLuint swizzle)
-{
- if (swizzle == GL_SWIZZLE_STR_ATI) {
- return src;
- } else if (swizzle == GL_SWIZZLE_STQ_ATI) {
- return ureg_swizzle(src,
- TGSI_SWIZZLE_X,
- TGSI_SWIZZLE_Y,
- TGSI_SWIZZLE_W,
- TGSI_SWIZZLE_Z);
- } else {
- struct ureg_dst tmp[2];
- struct ureg_src imm[3];
-
- tmp[0] = get_temp(t, MAX_NUM_FRAGMENT_REGISTERS_ATI);
- tmp[1] = get_temp(t, MAX_NUM_FRAGMENT_REGISTERS_ATI + 1);
- imm[0] = src;
- imm[1] = ureg_imm4f(t->ureg, 1.0f, 1.0f, 0.0f, 0.0f);
- imm[2] = ureg_imm4f(t->ureg, 0.0f, 0.0f, 1.0f, 1.0f);
- ureg_insn(t->ureg, TGSI_OPCODE_MAD, &tmp[0], 1, imm, 3, 0);
-
- if (swizzle == GL_SWIZZLE_STR_DR_ATI) {
- imm[0] = ureg_scalar(src, TGSI_SWIZZLE_Z);
- } else {
- imm[0] = ureg_scalar(src, TGSI_SWIZZLE_W);
- }
- ureg_insn(t->ureg, TGSI_OPCODE_RCP, &tmp[1], 1, &imm[0], 1, 0);
-
- imm[0] = ureg_src(tmp[0]);
- imm[1] = ureg_src(tmp[1]);
- ureg_insn(t->ureg, TGSI_OPCODE_MUL, &tmp[0], 1, imm, 2, 0);
-
- return ureg_src(tmp[0]);
- }
-}
-
-static struct ureg_src
-get_source(struct st_translate *t, GLuint src_type)
-{
- if (src_type >= GL_REG_0_ATI && src_type <= GL_REG_5_ATI) {
- if (t->regs_written[t->current_pass][src_type - GL_REG_0_ATI]) {
- return ureg_src(get_temp(t, src_type - GL_REG_0_ATI));
- } else {
- return ureg_imm1f(t->ureg, 0.0f);
- }
- } else if (src_type >= GL_CON_0_ATI && src_type <= GL_CON_7_ATI) {
- return t->constants[src_type - GL_CON_0_ATI];
- } else if (src_type == GL_ZERO) {
- return ureg_imm1f(t->ureg, 0.0f);
- } else if (src_type == GL_ONE) {
- return ureg_imm1f(t->ureg, 1.0f);
- } else if (src_type == GL_PRIMARY_COLOR_ARB) {
- return t->inputs[t->inputMapping[VARYING_SLOT_COL0]];
- } else if (src_type == GL_SECONDARY_INTERPOLATOR_ATI) {
- return t->inputs[t->inputMapping[VARYING_SLOT_COL1]];
- } else {
- /* frontend prevents this */
- unreachable("unknown source");
- }
-}
-
-static struct ureg_src
-prepare_argument(struct st_translate *t, const unsigned argId,
- const struct atifragshader_src_register *srcReg)
-{
- struct ureg_src src = get_source(t, srcReg->Index);
- struct ureg_dst arg = get_temp(t, MAX_NUM_FRAGMENT_REGISTERS_ATI + argId);
-
- switch (srcReg->argRep) {
- case GL_NONE:
- break;
- case GL_RED:
- src = ureg_scalar(src, TGSI_SWIZZLE_X);
- break;
- case GL_GREEN:
- src = ureg_scalar(src, TGSI_SWIZZLE_Y);
- break;
- case GL_BLUE:
- src = ureg_scalar(src, TGSI_SWIZZLE_Z);
- break;
- case GL_ALPHA:
- src = ureg_scalar(src, TGSI_SWIZZLE_W);
- break;
- }
- ureg_insn(t->ureg, TGSI_OPCODE_MOV, &arg, 1, &src, 1, 0);
-
- if (srcReg->argMod & GL_COMP_BIT_ATI) {
- struct ureg_src modsrc[2];
- modsrc[0] = ureg_imm1f(t->ureg, 1.0f);
- modsrc[1] = ureg_negate(ureg_src(arg));
-
- ureg_insn(t->ureg, TGSI_OPCODE_ADD, &arg, 1, modsrc, 2, 0);
- }
- if (srcReg->argMod & GL_BIAS_BIT_ATI) {
- struct ureg_src modsrc[2];
- modsrc[0] = ureg_src(arg);
- modsrc[1] = ureg_imm1f(t->ureg, -0.5f);
-
- ureg_insn(t->ureg, TGSI_OPCODE_ADD, &arg, 1, modsrc, 2, 0);
- }
- if (srcReg->argMod & GL_2X_BIT_ATI) {
- struct ureg_src modsrc[2];
- modsrc[0] = ureg_src(arg);
- modsrc[1] = ureg_src(arg);
-
- ureg_insn(t->ureg, TGSI_OPCODE_ADD, &arg, 1, modsrc, 2, 0);
- }
- if (srcReg->argMod & GL_NEGATE_BIT_ATI) {
- struct ureg_src modsrc[2];
- modsrc[0] = ureg_src(arg);
- modsrc[1] = ureg_imm1f(t->ureg, -1.0f);
-
- ureg_insn(t->ureg, TGSI_OPCODE_MUL, &arg, 1, modsrc, 2, 0);
- }
- return ureg_src(arg);
-}
-
-/* These instructions need special treatment */
-static void
-emit_special_inst(struct st_translate *t, const struct instruction_desc *desc,
- struct ureg_dst *dst, struct ureg_src *args, unsigned argcount)
-{
- struct ureg_dst tmp[1];
- struct ureg_src src[3];
-
- if (!strcmp(desc->name, "SUB")) {
- ureg_ADD(t->ureg, *dst, args[0], ureg_negate(args[1]));
- } else if (!strcmp(desc->name, "CND")) {
- tmp[0] = get_temp(t, MAX_NUM_FRAGMENT_REGISTERS_ATI + 2); /* re-purpose a3 */
- src[0] = ureg_imm1f(t->ureg, 0.5f);
- src[1] = ureg_negate(args[2]);
- ureg_insn(t->ureg, TGSI_OPCODE_ADD, tmp, 1, src, 2, 0);
- src[0] = ureg_src(tmp[0]);
- src[1] = args[0];
- src[2] = args[1];
- ureg_insn(t->ureg, TGSI_OPCODE_CMP, dst, 1, src, 3, 0);
- } else if (!strcmp(desc->name, "CND0")) {
- src[0] = args[2];
- src[1] = args[1];
- src[2] = args[0];
- ureg_insn(t->ureg, TGSI_OPCODE_CMP, dst, 1, src, 3, 0);
- } else if (!strcmp(desc->name, "DOT2_ADD")) {
- tmp[0] = get_temp(t, MAX_NUM_FRAGMENT_REGISTERS_ATI); /* re-purpose a1 */
- src[0] = args[0];
- src[1] = args[1];
- ureg_insn(t->ureg, TGSI_OPCODE_DP2, tmp, 1, src, 2, 0);
- src[0] = ureg_src(tmp[0]);
- src[1] = ureg_scalar(args[2], TGSI_SWIZZLE_Z);
- ureg_insn(t->ureg, TGSI_OPCODE_ADD, dst, 1, src, 2, 0);
- }
-}
-
-static void
-emit_arith_inst(struct st_translate *t,
- const struct instruction_desc *desc,
- struct ureg_dst *dst, struct ureg_src *args, unsigned argcount)
-{
- if (desc->TGSI_opcode == TGSI_OPCODE_NOP) {
- emit_special_inst(t, desc, dst, args, argcount);
- return;
- }
-
- ureg_insn(t->ureg, desc->TGSI_opcode, dst, 1, args, argcount, 0);
-}
-
-static void
-emit_dstmod(struct st_translate *t,
- struct ureg_dst dst, GLuint dstMod)
-{
- float imm;
- struct ureg_src src[3];
- GLuint scale = dstMod & ~GL_SATURATE_BIT_ATI;
-
- if (dstMod == GL_NONE) {
- return;
- }
-
- switch (scale) {
- case GL_2X_BIT_ATI:
- imm = 2.0f;
- break;
- case GL_4X_BIT_ATI:
- imm = 4.0f;
- break;
- case GL_8X_BIT_ATI:
- imm = 8.0f;
- break;
- case GL_HALF_BIT_ATI:
- imm = 0.5f;
- break;
- case GL_QUARTER_BIT_ATI:
- imm = 0.25f;
- break;
- case GL_EIGHTH_BIT_ATI:
- imm = 0.125f;
- break;
- default:
- imm = 1.0f;
- }
-
- src[0] = ureg_src(dst);
- src[1] = ureg_imm1f(t->ureg, imm);
- if (dstMod & GL_SATURATE_BIT_ATI) {
- dst = ureg_saturate(dst);
- }
- ureg_insn(t->ureg, TGSI_OPCODE_MUL, &dst, 1, src, 2, 0);
-}
-
-/**
- * Compile one setup instruction to TGSI instructions.
- */
-static void
-compile_setupinst(struct st_translate *t,
- const unsigned r,
- const struct atifs_setupinst *texinst)
-{
- struct ureg_dst dst[1];
- struct ureg_src src[2];
-
- if (!texinst->Opcode)
- return;
-
- dst[0] = get_temp(t, r);
-
- GLuint pass_tex = texinst->src;
-
- if (pass_tex >= GL_TEXTURE0_ARB && pass_tex <= GL_TEXTURE7_ARB) {
- unsigned attr = pass_tex - GL_TEXTURE0_ARB + VARYING_SLOT_TEX0;
-
- src[0] = t->inputs[t->inputMapping[attr]];
- } else if (pass_tex >= GL_REG_0_ATI && pass_tex <= GL_REG_5_ATI) {
- unsigned reg = pass_tex - GL_REG_0_ATI;
-
- /* the frontend already validated that REG is only allowed in second pass */
- if (t->regs_written[0][reg]) {
- src[0] = ureg_src(t->temps[reg]);
- } else {
- src[0] = ureg_imm1f(t->ureg, 0.0f);
- }
- }
- src[0] = apply_swizzle(t, src[0], texinst->swizzle);
-
- if (texinst->Opcode == ATI_FRAGMENT_SHADER_SAMPLE_OP) {
- /* by default texture and sampler indexes are the same */
- src[1] = t->samplers[r];
- /* the texture target is still unknown, it will be fixed in the draw call */
- ureg_tex_insn(t->ureg, TGSI_OPCODE_TEX, dst, 1, TGSI_TEXTURE_2D,
- TGSI_RETURN_TYPE_FLOAT, NULL, 0, src, 2);
- } else if (texinst->Opcode == ATI_FRAGMENT_SHADER_PASS_OP) {
- ureg_insn(t->ureg, TGSI_OPCODE_MOV, dst, 1, src, 1, 0);
- }
-
- t->regs_written[t->current_pass][r] = true;
-}
-
-/**
- * Compile one arithmetic operation COLOR&ALPHA pair into TGSI instructions.
- */
-static void
-compile_instruction(struct st_translate *t,
- const struct atifs_instruction *inst)
-{
- unsigned optype;
-
- for (optype = 0; optype < 2; optype++) { /* color, alpha */
- const struct instruction_desc *desc;
- struct ureg_dst dst[1];
- struct ureg_src args[3]; /* arguments for the main operation */
- unsigned arg;
- unsigned dstreg = inst->DstReg[optype].Index - GL_REG_0_ATI;
-
- if (!inst->Opcode[optype])
- continue;
-
- desc = &inst_desc[inst->Opcode[optype] - GL_MOV_ATI];
-
- /* prepare the arguments */
- for (arg = 0; arg < desc->arg_count; arg++) {
- if (arg >= inst->ArgCount[optype]) {
- _mesa_warning(0, "Using 0 for missing argument %d of %s\n",
- arg, desc->name);
- args[arg] = ureg_imm1f(t->ureg, 0.0f);
- } else {
- args[arg] = prepare_argument(t, arg,
- &inst->SrcReg[optype][arg]);
- }
- }
-
- /* prepare dst */
- dst[0] = get_temp(t, dstreg);
-
- dst[0] = ureg_writemask(dst[0], inst->DstReg[optype].dstMask);
-
- /* emit the main instruction */
- emit_arith_inst(t, desc, dst, args, arg);
-
- emit_dstmod(t, *dst, inst->DstReg[optype].dstMod);
-
- t->regs_written[t->current_pass][dstreg] = true;
- }
-}
-
-static void
-finalize_shader(struct st_translate *t, unsigned numPasses)
-{
- struct ureg_dst dst[1] = { { 0 } };
- struct ureg_src src[1] = { { 0 } };
-
- if (t->regs_written[numPasses-1][0]) {
- /* copy the result into the OUT slot */
- dst[0] = t->outputs[t->outputMapping[FRAG_RESULT_COLOR]];
- src[0] = ureg_src(t->temps[0]);
- ureg_insn(t->ureg, TGSI_OPCODE_MOV, dst, 1, src, 1, 0);
- }
-
- /* signal the end of the program */
- ureg_insn(t->ureg, TGSI_OPCODE_END, dst, 0, src, 0, 0);
-}
-
-/**
- * Called when a new variant is needed, we need to translate
- * the ATI fragment shader to TGSI
- */
-enum pipe_error
-st_translate_atifs_program(
- struct ureg_program *ureg,
- struct ati_fragment_shader *atifs,
- struct gl_program *program,
- GLuint numInputs,
- const ubyte inputMapping[],
- const ubyte inputSemanticName[],
- const ubyte inputSemanticIndex[],
- const ubyte interpMode[],
- GLuint numOutputs,
- const ubyte outputMapping[],
- const ubyte outputSemanticName[],
- const ubyte outputSemanticIndex[])
-{
- enum pipe_error ret = PIPE_OK;
-
- unsigned pass, i, r;
-
- struct st_translate translate, *t;
- t = &translate;
- memset(t, 0, sizeof *t);
-
- t->inputMapping = inputMapping;
- t->outputMapping = outputMapping;
- t->ureg = ureg;
- t->atifs = atifs;
-
- /*
- * Declare input attributes.
- */
- for (i = 0; i < numInputs; i++) {
- t->inputs[i] = ureg_DECL_fs_input(ureg,
- inputSemanticName[i],
- inputSemanticIndex[i],
- interpMode[i]);
- }
-
- /*
- * Declare output attributes:
- * we always have numOutputs=1 and it's FRAG_RESULT_COLOR
- */
- t->outputs[0] = ureg_DECL_output(ureg,
- TGSI_SEMANTIC_COLOR,
- outputSemanticIndex[0]);
-
- /* Emit constants and immediates. Mesa uses a single index space
- * for these, so we put all the translated regs in t->constants.
- */
- if (program->Parameters) {
- t->constants = calloc(program->Parameters->NumParameters,
- sizeof t->constants[0]);
- if (t->constants == NULL) {
- ret = PIPE_ERROR_OUT_OF_MEMORY;
- goto out;
- }
-
- for (i = 0; i < program->Parameters->NumParameters; i++) {
- unsigned pvo = program->Parameters->Parameters[i].ValueOffset;
-
- switch (program->Parameters->Parameters[i].Type) {
- case PROGRAM_STATE_VAR:
- case PROGRAM_UNIFORM:
- t->constants[i] = ureg_DECL_constant(ureg, i);
- break;
- case PROGRAM_CONSTANT:
- t->constants[i] =
- ureg_DECL_immediate(ureg,
- (const float*)program->Parameters->ParameterValues + pvo,
- 4);
- break;
- default:
- break;
- }
- }
- }
-
- /* texture samplers */
- for (i = 0; i < MAX_NUM_FRAGMENT_REGISTERS_ATI; i++) {
- if (program->SamplersUsed & (1 << i)) {
- t->samplers[i] = ureg_DECL_sampler(ureg, i);
- /* the texture target is still unknown, it will be fixed in the draw call */
- ureg_DECL_sampler_view(ureg, i, TGSI_TEXTURE_2D,
- TGSI_RETURN_TYPE_FLOAT,
- TGSI_RETURN_TYPE_FLOAT,
- TGSI_RETURN_TYPE_FLOAT,
- TGSI_RETURN_TYPE_FLOAT);
- }
- }
-
- /* emit instructions */
- for (pass = 0; pass < atifs->NumPasses; pass++) {
- t->current_pass = pass;
- for (r = 0; r < MAX_NUM_FRAGMENT_REGISTERS_ATI; r++) {
- struct atifs_setupinst *texinst = &atifs->SetupInst[pass][r];
- compile_setupinst(t, r, texinst);
- }
- for (i = 0; i < atifs->numArithInstr[pass]; i++) {
- struct atifs_instruction *inst = &atifs->Instructions[pass][i];
- compile_instruction(t, inst);
- }
- }
-
- finalize_shader(t, atifs->NumPasses);
-
-out:
- free(t->constants);
-
- if (t->error) {
- debug_printf("%s: translate error flag set\n", __func__);
- }
-
- return ret;
-}
-
-/**
- * Called in ProgramStringNotify, we need to fill the metadata of the
- * gl_program attached to the ati_fragment_shader
- */
-void
-st_init_atifs_prog(struct gl_context *ctx, struct gl_program *prog)
-{
- /* we know this is st_fragment_program, because of st_new_ati_fs() */
- struct st_program *stfp = (struct st_program *) prog;
- struct ati_fragment_shader *atifs = stfp->ati_fs;
-
- unsigned pass, i, r, optype, arg;
-
- static const gl_state_index16 fog_params_state[STATE_LENGTH] =
- {STATE_INTERNAL, STATE_FOG_PARAMS_OPTIMIZED, 0, 0 };
- static const gl_state_index16 fog_color[STATE_LENGTH] =
- {STATE_FOG_COLOR, 0, 0, 0 };
-
- prog->info.inputs_read = 0;
- prog->info.outputs_written = BITFIELD64_BIT(FRAG_RESULT_COLOR);
- prog->SamplersUsed = 0;
- prog->Parameters = _mesa_new_parameter_list();
-
- /* fill in inputs_read, SamplersUsed, TexturesUsed */
- for (pass = 0; pass < atifs->NumPasses; pass++) {
- for (r = 0; r < MAX_NUM_FRAGMENT_REGISTERS_ATI; r++) {
- struct atifs_setupinst *texinst = &atifs->SetupInst[pass][r];
- GLuint pass_tex = texinst->src;
-
- if (texinst->Opcode == ATI_FRAGMENT_SHADER_SAMPLE_OP) {
- /* mark which texcoords are used */
- prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_TEX0 + pass_tex - GL_TEXTURE0_ARB);
- /* by default there is 1:1 mapping between samplers and textures */
- prog->SamplersUsed |= (1 << r);
- /* the target is unknown here, it will be fixed in the draw call */
- prog->TexturesUsed[r] = TEXTURE_2D_BIT;
- } else if (texinst->Opcode == ATI_FRAGMENT_SHADER_PASS_OP) {
- if (pass_tex >= GL_TEXTURE0_ARB && pass_tex <= GL_TEXTURE7_ARB) {
- prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_TEX0 + pass_tex - GL_TEXTURE0_ARB);
- }
- }
- }
- }
- for (pass = 0; pass < atifs->NumPasses; pass++) {
- for (i = 0; i < atifs->numArithInstr[pass]; i++) {
- struct atifs_instruction *inst = &atifs->Instructions[pass][i];
-
- for (optype = 0; optype < 2; optype++) { /* color, alpha */
- if (inst->Opcode[optype]) {
- for (arg = 0; arg < inst->ArgCount[optype]; arg++) {
- GLint index = inst->SrcReg[optype][arg].Index;
- if (index == GL_PRIMARY_COLOR_EXT) {
- prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_COL0);
- } else if (index == GL_SECONDARY_INTERPOLATOR_ATI) {
- /* note: ATI_fragment_shader.txt never specifies what
- * GL_SECONDARY_INTERPOLATOR_ATI is, swrast uses
- * VARYING_SLOT_COL1 for this input */
- prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_COL1);
- }
- }
- }
- }
- }
- }
- /* we may need fog */
- prog->info.inputs_read |= BITFIELD64_BIT(VARYING_SLOT_FOGC);
-
- /* we always have the ATI_fs constants, and the fog params */
- for (i = 0; i < MAX_NUM_FRAGMENT_CONSTANTS_ATI; i++) {
- _mesa_add_parameter(prog->Parameters, PROGRAM_UNIFORM,
- NULL, 4, GL_FLOAT, NULL, NULL, true);
- }
- _mesa_add_state_reference(prog->Parameters, fog_params_state);
- _mesa_add_state_reference(prog->Parameters, fog_color);
-}
-
-
-struct tgsi_atifs_transform {
- struct tgsi_transform_context base;
- struct tgsi_shader_info info;
- const struct st_fp_variant_key *key;
- bool first_instruction_emitted;
- unsigned fog_factor_temp;
-};
-
-static inline struct tgsi_atifs_transform *
-tgsi_atifs_transform(struct tgsi_transform_context *tctx)
-{
- return (struct tgsi_atifs_transform *)tctx;
-}
-
-/* copied from st_cb_drawpixels_shader.c */
-static void
-set_src(struct tgsi_full_instruction *inst, unsigned i, unsigned file, unsigned index,
- unsigned x, unsigned y, unsigned z, unsigned w)
-{
- inst->Src[i].Register.File = file;
- inst->Src[i].Register.Index = index;
- inst->Src[i].Register.SwizzleX = x;
- inst->Src[i].Register.SwizzleY = y;
- inst->Src[i].Register.SwizzleZ = z;
- inst->Src[i].Register.SwizzleW = w;
- if (file == TGSI_FILE_CONSTANT) {
- inst->Src[i].Register.Dimension = 1;
- inst->Src[i].Dimension.Index = 0;
- }
-}
-
-#define SET_SRC(inst, i, file, index, x, y, z, w) \
- set_src(inst, i, file, index, TGSI_SWIZZLE_##x, TGSI_SWIZZLE_##y, \
- TGSI_SWIZZLE_##z, TGSI_SWIZZLE_##w)
-
-static void
-transform_decl(struct tgsi_transform_context *tctx,
- struct tgsi_full_declaration *decl)
-{
- struct tgsi_atifs_transform *ctx = tgsi_atifs_transform(tctx);
-
- if (decl->Declaration.File == TGSI_FILE_SAMPLER_VIEW) {
- /* fix texture target */
- unsigned newtarget = ctx->key->texture_targets[decl->Range.First];
- if (newtarget)
- decl->SamplerView.Resource = newtarget;
- }
-
- tctx->emit_declaration(tctx, decl);
-}
-
-static void
-transform_instr(struct tgsi_transform_context *tctx,
- struct tgsi_full_instruction *current_inst)
-{
- struct tgsi_atifs_transform *ctx = tgsi_atifs_transform(tctx);
-
- if (ctx->first_instruction_emitted)
- goto transform_inst;
-
- ctx->first_instruction_emitted = true;
-
- if (ctx->key->fog) {
- /* add a new temp for the fog factor */
- ctx->fog_factor_temp = ctx->info.file_max[TGSI_FILE_TEMPORARY] + 1;
- tgsi_transform_temp_decl(tctx, ctx->fog_factor_temp);
- }
-
-transform_inst:
- if (current_inst->Instruction.Opcode == TGSI_OPCODE_TEX) {
- /* fix texture target */
- unsigned newtarget = ctx->key->texture_targets[current_inst->Src[1].Register.Index];
- if (newtarget)
- current_inst->Texture.Texture = newtarget;
-
- } else if (ctx->key->fog && current_inst->Instruction.Opcode == TGSI_OPCODE_MOV &&
- current_inst->Dst[0].Register.File == TGSI_FILE_OUTPUT) {
- struct tgsi_full_instruction inst;
- unsigned i;
- int fogc_index = -1;
- int reg0_index = current_inst->Src[0].Register.Index;
-
- /* find FOGC input */
- for (i = 0; i < ctx->info.num_inputs; i++) {
- if (ctx->info.input_semantic_name[i] == TGSI_SEMANTIC_FOG) {
- fogc_index = i;
- break;
- }
- }
- if (fogc_index < 0) {
- /* should never be reached, because fog coord input is always declared */
- tctx->emit_instruction(tctx, current_inst);
- return;
- }
-
- /* compute the 1 component fog factor f */
- if (ctx->key->fog == FOG_LINEAR) {
- /* LINEAR formula: f = (end - z) / (end - start)
- * with optimized parameters:
- * f = MAD(fogcoord, oparams.x, oparams.y)
- */
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_MAD;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 3;
- SET_SRC(&inst, 0, TGSI_FILE_INPUT, fogc_index, X, Y, Z, W);
- SET_SRC(&inst, 1, TGSI_FILE_CONSTANT, MAX_NUM_FRAGMENT_CONSTANTS_ATI, X, X, X, X);
- SET_SRC(&inst, 2, TGSI_FILE_CONSTANT, MAX_NUM_FRAGMENT_CONSTANTS_ATI, Y, Y, Y, Y);
- tctx->emit_instruction(tctx, &inst);
- } else if (ctx->key->fog == FOG_EXP) {
- /* EXP formula: f = exp(-dens * z)
- * with optimized parameters:
- * f = MUL(fogcoord, oparams.z); f= EX2(-f)
- */
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_MUL;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 2;
- SET_SRC(&inst, 0, TGSI_FILE_INPUT, fogc_index, X, Y, Z, W);
- SET_SRC(&inst, 1, TGSI_FILE_CONSTANT, MAX_NUM_FRAGMENT_CONSTANTS_ATI, Z, Z, Z, Z);
- tctx->emit_instruction(tctx, &inst);
-
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_EX2;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 1;
- SET_SRC(&inst, 0, TGSI_FILE_TEMPORARY, ctx->fog_factor_temp, X, Y, Z, W);
- inst.Src[0].Register.Negate = 1;
- tctx->emit_instruction(tctx, &inst);
- } else if (ctx->key->fog == FOG_EXP2) {
- /* EXP2 formula: f = exp(-(dens * z)^2)
- * with optimized parameters:
- * f = MUL(fogcoord, oparams.w); f=MUL(f, f); f= EX2(-f)
- */
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_MUL;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 2;
- SET_SRC(&inst, 0, TGSI_FILE_INPUT, fogc_index, X, Y, Z, W);
- SET_SRC(&inst, 1, TGSI_FILE_CONSTANT, MAX_NUM_FRAGMENT_CONSTANTS_ATI, W, W, W, W);
- tctx->emit_instruction(tctx, &inst);
-
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_MUL;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 2;
- SET_SRC(&inst, 0, TGSI_FILE_TEMPORARY, ctx->fog_factor_temp, X, Y, Z, W);
- SET_SRC(&inst, 1, TGSI_FILE_TEMPORARY, ctx->fog_factor_temp, X, Y, Z, W);
- tctx->emit_instruction(tctx, &inst);
-
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_EX2;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 1;
- SET_SRC(&inst, 0, TGSI_FILE_TEMPORARY, ctx->fog_factor_temp, X, Y, Z, W);
- inst.Src[0].Register.Negate ^= 1;
- tctx->emit_instruction(tctx, &inst);
- }
- /* f = saturate(f) */
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_MOV;
- inst.Instruction.NumDstRegs = 1;
- inst.Instruction.Saturate = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = ctx->fog_factor_temp;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 1;
- SET_SRC(&inst, 0, TGSI_FILE_TEMPORARY, ctx->fog_factor_temp, X, Y, Z, W);
- tctx->emit_instruction(tctx, &inst);
-
- /* REG0 = LRP(f, REG0, fogcolor) */
- inst = tgsi_default_full_instruction();
- inst.Instruction.Opcode = TGSI_OPCODE_LRP;
- inst.Instruction.NumDstRegs = 1;
- inst.Dst[0].Register.File = TGSI_FILE_TEMPORARY;
- inst.Dst[0].Register.Index = reg0_index;
- inst.Dst[0].Register.WriteMask = TGSI_WRITEMASK_XYZW;
- inst.Instruction.NumSrcRegs = 3;
- SET_SRC(&inst, 0, TGSI_FILE_TEMPORARY, ctx->fog_factor_temp, X, X, X, Y);
- SET_SRC(&inst, 1, TGSI_FILE_TEMPORARY, reg0_index, X, Y, Z, W);
- SET_SRC(&inst, 2, TGSI_FILE_CONSTANT, MAX_NUM_FRAGMENT_CONSTANTS_ATI + 1, X, Y, Z, W);
- tctx->emit_instruction(tctx, &inst);
- }
-
- tctx->emit_instruction(tctx, current_inst);
-}
-
-/*
- * A post-process step in the draw call to fix texture targets and
- * insert code for fog.
- */
-const struct tgsi_token *
-st_fixup_atifs(const struct tgsi_token *tokens,
- const struct st_fp_variant_key *key)
-{
- struct tgsi_atifs_transform ctx;
- struct tgsi_token *newtoks;
- int newlen;
-
- memset(&ctx, 0, sizeof(ctx));
- ctx.base.transform_declaration = transform_decl;
- ctx.base.transform_instruction = transform_instr;
- ctx.key = key;
- tgsi_scan_shader(tokens, &ctx.info);
-
- newlen = tgsi_num_tokens(tokens) + 30;
- newtoks = tgsi_alloc_tokens(newlen);
- if (!newtoks)
- return NULL;
-
- tgsi_transform_shader(tokens, newtoks, newlen, &ctx.base);
- return newtoks;
-}
-