2 * Copyright © 2010 Intel Corporation
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
24 #include "main/core.h" /* for MAX2 */
26 #include "ir_visitor.h"
27 #include "glsl_types.h"
29 ir_rvalue::ir_rvalue()
31 this->type = glsl_type::error_type;
34 bool ir_rvalue::is_zero() const
39 bool ir_rvalue::is_one() const
44 bool ir_rvalue::is_negative_one() const
49 bool ir_rvalue::is_basis() const
55 * Modify the swizzle make to move one component to another
57 * \param m IR swizzle to be modified
58 * \param from Component in the RHS that is to be swizzled
59 * \param to Desired swizzle location of \c from
62 update_rhs_swizzle(ir_swizzle_mask &m, unsigned from, unsigned to)
65 case 0: m.x = from; break;
66 case 1: m.y = from; break;
67 case 2: m.z = from; break;
68 case 3: m.w = from; break;
69 default: assert(!"Should not get here.");
72 m.num_components = MAX2(m.num_components, (to + 1));
76 ir_assignment::set_lhs(ir_rvalue *lhs)
79 bool swizzled = false;
82 ir_swizzle *swiz = lhs->as_swizzle();
87 unsigned write_mask = 0;
88 ir_swizzle_mask rhs_swiz = { 0, 0, 0, 0, 0, 0 };
90 for (unsigned i = 0; i < swiz->mask.num_components; i++) {
94 case 0: c = swiz->mask.x; break;
95 case 1: c = swiz->mask.y; break;
96 case 2: c = swiz->mask.z; break;
97 case 3: c = swiz->mask.w; break;
98 default: assert(!"Should not get here.");
101 write_mask |= (((this->write_mask >> i) & 1) << c);
102 update_rhs_swizzle(rhs_swiz, i, c);
105 this->write_mask = write_mask;
108 this->rhs = new(mem_ctx) ir_swizzle(this->rhs, rhs_swiz);
113 /* Now, RHS channels line up with the LHS writemask. Collapse it
114 * to just the channels that will be written.
116 ir_swizzle_mask rhs_swiz = { 0, 0, 0, 0, 0, 0 };
118 for (int i = 0; i < 4; i++) {
119 if (write_mask & (1 << i))
120 update_rhs_swizzle(rhs_swiz, i, rhs_chan++);
122 this->rhs = new(mem_ctx) ir_swizzle(this->rhs, rhs_swiz);
125 assert((lhs == NULL) || lhs->as_dereference());
127 this->lhs = (ir_dereference *) lhs;
131 ir_assignment::whole_variable_written()
133 ir_variable *v = this->lhs->whole_variable_referenced();
138 if (v->type->is_scalar())
141 if (v->type->is_vector()) {
142 const unsigned mask = (1U << v->type->vector_elements) - 1;
144 if (mask != this->write_mask)
148 /* Either all the vector components are assigned or the variable is some
149 * composite type (and the whole thing is assigned.
154 ir_assignment::ir_assignment(ir_dereference *lhs, ir_rvalue *rhs,
155 ir_rvalue *condition, unsigned write_mask)
157 this->ir_type = ir_type_assignment;
158 this->condition = condition;
161 this->write_mask = write_mask;
163 if (lhs->type->is_scalar() || lhs->type->is_vector()) {
164 int lhs_components = 0;
165 for (int i = 0; i < 4; i++) {
166 if (write_mask & (1 << i))
170 assert(lhs_components == this->rhs->type->vector_elements);
174 ir_assignment::ir_assignment(ir_rvalue *lhs, ir_rvalue *rhs,
175 ir_rvalue *condition)
177 this->ir_type = ir_type_assignment;
178 this->condition = condition;
181 /* If the RHS is a vector type, assume that all components of the vector
182 * type are being written to the LHS. The write mask comes from the RHS
183 * because we can have a case where the LHS is a vec4 and the RHS is a
184 * vec3. In that case, the assignment is:
186 * (assign (...) (xyz) (var_ref lhs) (var_ref rhs))
188 if (rhs->type->is_vector())
189 this->write_mask = (1U << rhs->type->vector_elements) - 1;
190 else if (rhs->type->is_scalar())
191 this->write_mask = 1;
193 this->write_mask = 0;
199 ir_expression::ir_expression(int op, const struct glsl_type *type,
202 assert(get_num_operands(ir_expression_operation(op)) == 1);
203 this->ir_type = ir_type_expression;
205 this->operation = ir_expression_operation(op);
206 this->operands[0] = op0;
207 this->operands[1] = NULL;
208 this->operands[2] = NULL;
209 this->operands[3] = NULL;
212 ir_expression::ir_expression(int op, const struct glsl_type *type,
213 ir_rvalue *op0, ir_rvalue *op1)
215 assert(((op1 == NULL) && (get_num_operands(ir_expression_operation(op)) == 1))
216 || (get_num_operands(ir_expression_operation(op)) == 2));
217 this->ir_type = ir_type_expression;
219 this->operation = ir_expression_operation(op);
220 this->operands[0] = op0;
221 this->operands[1] = op1;
222 this->operands[2] = NULL;
223 this->operands[3] = NULL;
226 ir_expression::ir_expression(int op, const struct glsl_type *type,
227 ir_rvalue *op0, ir_rvalue *op1,
228 ir_rvalue *op2, ir_rvalue *op3)
230 this->ir_type = ir_type_expression;
232 this->operation = ir_expression_operation(op);
233 this->operands[0] = op0;
234 this->operands[1] = op1;
235 this->operands[2] = op2;
236 this->operands[3] = op3;
239 ir_expression::ir_expression(int op, ir_rvalue *op0)
241 this->ir_type = ir_type_expression;
243 this->operation = ir_expression_operation(op);
244 this->operands[0] = op0;
245 this->operands[1] = NULL;
246 this->operands[2] = NULL;
247 this->operands[3] = NULL;
249 assert(op <= ir_last_unop);
251 switch (this->operation) {
252 case ir_unop_bit_not:
253 case ir_unop_logic_not:
268 case ir_unop_round_even:
271 case ir_unop_sin_reduced:
272 case ir_unop_cos_reduced:
275 this->type = op0->type;
281 case ir_unop_bitcast_f2i:
282 this->type = glsl_type::get_instance(GLSL_TYPE_INT,
283 op0->type->vector_elements, 1);
289 case ir_unop_bitcast_i2f:
290 case ir_unop_bitcast_u2f:
291 this->type = glsl_type::get_instance(GLSL_TYPE_FLOAT,
292 op0->type->vector_elements, 1);
297 this->type = glsl_type::get_instance(GLSL_TYPE_BOOL,
298 op0->type->vector_elements, 1);
303 case ir_unop_bitcast_f2u:
304 this->type = glsl_type::get_instance(GLSL_TYPE_UINT,
305 op0->type->vector_elements, 1);
309 this->type = glsl_type::float_type;
313 this->type = glsl_type::bool_type;
317 assert(!"not reached: missing automatic type setup for ir_expression");
318 this->type = op0->type;
323 ir_expression::ir_expression(int op, ir_rvalue *op0, ir_rvalue *op1)
325 this->ir_type = ir_type_expression;
327 this->operation = ir_expression_operation(op);
328 this->operands[0] = op0;
329 this->operands[1] = op1;
330 this->operands[2] = NULL;
331 this->operands[3] = NULL;
333 assert(op > ir_last_unop);
335 switch (this->operation) {
336 case ir_binop_all_equal:
337 case ir_binop_any_nequal:
338 this->type = glsl_type::bool_type;
349 if (op0->type->is_scalar()) {
350 this->type = op1->type;
351 } else if (op1->type->is_scalar()) {
352 this->type = op0->type;
354 /* FINISHME: matrix types */
355 assert(!op0->type->is_matrix() && !op1->type->is_matrix());
356 assert(op0->type == op1->type);
357 this->type = op0->type;
361 case ir_binop_logic_and:
362 case ir_binop_logic_xor:
363 case ir_binop_logic_or:
364 case ir_binop_bit_and:
365 case ir_binop_bit_xor:
366 case ir_binop_bit_or:
367 if (op0->type->is_scalar()) {
368 this->type = op1->type;
369 } else if (op1->type->is_scalar()) {
370 this->type = op0->type;
375 case ir_binop_nequal:
376 case ir_binop_lequal:
377 case ir_binop_gequal:
379 case ir_binop_greater:
380 assert(op0->type == op1->type);
381 this->type = glsl_type::get_instance(GLSL_TYPE_BOOL,
382 op0->type->vector_elements, 1);
386 this->type = glsl_type::float_type;
389 case ir_binop_lshift:
390 case ir_binop_rshift:
391 this->type = op0->type;
395 assert(!"not reached: missing automatic type setup for ir_expression");
396 this->type = glsl_type::float_type;
401 ir_expression::get_num_operands(ir_expression_operation op)
403 assert(op <= ir_last_opcode);
405 if (op <= ir_last_unop)
408 if (op <= ir_last_binop)
411 if (op == ir_quadop_vector)
418 static const char *const operator_strs[] = {
486 const char *ir_expression::operator_string(ir_expression_operation op)
488 assert((unsigned int) op < Elements(operator_strs));
489 assert(Elements(operator_strs) == (ir_quadop_vector + 1));
490 return operator_strs[op];
493 const char *ir_expression::operator_string()
495 return operator_string(this->operation);
499 depth_layout_string(ir_depth_layout layout)
502 case ir_depth_layout_none: return "";
503 case ir_depth_layout_any: return "depth_any";
504 case ir_depth_layout_greater: return "depth_greater";
505 case ir_depth_layout_less: return "depth_less";
506 case ir_depth_layout_unchanged: return "depth_unchanged";
514 ir_expression_operation
515 ir_expression::get_operator(const char *str)
517 const int operator_count = sizeof(operator_strs) / sizeof(operator_strs[0]);
518 for (int op = 0; op < operator_count; op++) {
519 if (strcmp(str, operator_strs[op]) == 0)
520 return (ir_expression_operation) op;
522 return (ir_expression_operation) -1;
525 ir_constant::ir_constant()
527 this->ir_type = ir_type_constant;
530 ir_constant::ir_constant(const struct glsl_type *type,
531 const ir_constant_data *data)
533 assert((type->base_type >= GLSL_TYPE_UINT)
534 && (type->base_type <= GLSL_TYPE_BOOL));
536 this->ir_type = ir_type_constant;
538 memcpy(& this->value, data, sizeof(this->value));
541 ir_constant::ir_constant(float f)
543 this->ir_type = ir_type_constant;
544 this->type = glsl_type::float_type;
545 this->value.f[0] = f;
546 for (int i = 1; i < 16; i++) {
547 this->value.f[i] = 0;
551 ir_constant::ir_constant(unsigned int u)
553 this->ir_type = ir_type_constant;
554 this->type = glsl_type::uint_type;
555 this->value.u[0] = u;
556 for (int i = 1; i < 16; i++) {
557 this->value.u[i] = 0;
561 ir_constant::ir_constant(int i)
563 this->ir_type = ir_type_constant;
564 this->type = glsl_type::int_type;
565 this->value.i[0] = i;
566 for (int i = 1; i < 16; i++) {
567 this->value.i[i] = 0;
571 ir_constant::ir_constant(bool b)
573 this->ir_type = ir_type_constant;
574 this->type = glsl_type::bool_type;
575 this->value.b[0] = b;
576 for (int i = 1; i < 16; i++) {
577 this->value.b[i] = false;
581 ir_constant::ir_constant(const ir_constant *c, unsigned i)
583 this->ir_type = ir_type_constant;
584 this->type = c->type->get_base_type();
586 switch (this->type->base_type) {
587 case GLSL_TYPE_UINT: this->value.u[0] = c->value.u[i]; break;
588 case GLSL_TYPE_INT: this->value.i[0] = c->value.i[i]; break;
589 case GLSL_TYPE_FLOAT: this->value.f[0] = c->value.f[i]; break;
590 case GLSL_TYPE_BOOL: this->value.b[0] = c->value.b[i]; break;
591 default: assert(!"Should not get here."); break;
595 ir_constant::ir_constant(const struct glsl_type *type, exec_list *value_list)
597 this->ir_type = ir_type_constant;
600 assert(type->is_scalar() || type->is_vector() || type->is_matrix()
601 || type->is_record() || type->is_array());
603 if (type->is_array()) {
604 this->array_elements = ralloc_array(this, ir_constant *, type->length);
606 foreach_list(node, value_list) {
607 ir_constant *value = (ir_constant *) node;
608 assert(value->as_constant() != NULL);
610 this->array_elements[i++] = value;
615 /* If the constant is a record, the types of each of the entries in
616 * value_list must be a 1-for-1 match with the structure components. Each
617 * entry must also be a constant. Just move the nodes from the value_list
618 * to the list in the ir_constant.
620 /* FINISHME: Should there be some type checking and / or assertions here? */
621 /* FINISHME: Should the new constant take ownership of the nodes from
622 * FINISHME: value_list, or should it make copies?
624 if (type->is_record()) {
625 value_list->move_nodes_to(& this->components);
629 for (unsigned i = 0; i < 16; i++) {
630 this->value.u[i] = 0;
633 ir_constant *value = (ir_constant *) (value_list->head);
635 /* Constructors with exactly one scalar argument are special for vectors
636 * and matrices. For vectors, the scalar value is replicated to fill all
637 * the components. For matrices, the scalar fills the components of the
638 * diagonal while the rest is filled with 0.
640 if (value->type->is_scalar() && value->next->is_tail_sentinel()) {
641 if (type->is_matrix()) {
642 /* Matrix - fill diagonal (rest is already set to 0) */
643 assert(type->base_type == GLSL_TYPE_FLOAT);
644 for (unsigned i = 0; i < type->matrix_columns; i++)
645 this->value.f[i * type->vector_elements + i] = value->value.f[0];
647 /* Vector or scalar - fill all components */
648 switch (type->base_type) {
651 for (unsigned i = 0; i < type->components(); i++)
652 this->value.u[i] = value->value.u[0];
654 case GLSL_TYPE_FLOAT:
655 for (unsigned i = 0; i < type->components(); i++)
656 this->value.f[i] = value->value.f[0];
659 for (unsigned i = 0; i < type->components(); i++)
660 this->value.b[i] = value->value.b[0];
663 assert(!"Should not get here.");
670 if (type->is_matrix() && value->type->is_matrix()) {
671 assert(value->next->is_tail_sentinel());
673 /* From section 5.4.2 of the GLSL 1.20 spec:
674 * "If a matrix is constructed from a matrix, then each component
675 * (column i, row j) in the result that has a corresponding component
676 * (column i, row j) in the argument will be initialized from there."
678 unsigned cols = MIN2(type->matrix_columns, value->type->matrix_columns);
679 unsigned rows = MIN2(type->vector_elements, value->type->vector_elements);
680 for (unsigned i = 0; i < cols; i++) {
681 for (unsigned j = 0; j < rows; j++) {
682 const unsigned src = i * value->type->vector_elements + j;
683 const unsigned dst = i * type->vector_elements + j;
684 this->value.f[dst] = value->value.f[src];
688 /* "All other components will be initialized to the identity matrix." */
689 for (unsigned i = cols; i < type->matrix_columns; i++)
690 this->value.f[i * type->vector_elements + i] = 1.0;
695 /* Use each component from each entry in the value_list to initialize one
696 * component of the constant being constructed.
698 for (unsigned i = 0; i < type->components(); /* empty */) {
699 assert(value->as_constant() != NULL);
700 assert(!value->is_tail_sentinel());
702 for (unsigned j = 0; j < value->type->components(); j++) {
703 switch (type->base_type) {
705 this->value.u[i] = value->get_uint_component(j);
708 this->value.i[i] = value->get_int_component(j);
710 case GLSL_TYPE_FLOAT:
711 this->value.f[i] = value->get_float_component(j);
714 this->value.b[i] = value->get_bool_component(j);
717 /* FINISHME: What to do? Exceptions are not the answer.
723 if (i >= type->components())
727 value = (ir_constant *) value->next;
732 ir_constant::zero(void *mem_ctx, const glsl_type *type)
734 assert(type->is_scalar() || type->is_vector() || type->is_matrix()
735 || type->is_record() || type->is_array());
737 ir_constant *c = new(mem_ctx) ir_constant;
739 memset(&c->value, 0, sizeof(c->value));
741 if (type->is_array()) {
742 c->array_elements = ralloc_array(c, ir_constant *, type->length);
744 for (unsigned i = 0; i < type->length; i++)
745 c->array_elements[i] = ir_constant::zero(c, type->element_type());
748 if (type->is_record()) {
749 for (unsigned i = 0; i < type->length; i++) {
750 ir_constant *comp = ir_constant::zero(mem_ctx, type->fields.structure[i].type);
751 c->components.push_tail(comp);
759 ir_constant::get_bool_component(unsigned i) const
761 switch (this->type->base_type) {
762 case GLSL_TYPE_UINT: return this->value.u[i] != 0;
763 case GLSL_TYPE_INT: return this->value.i[i] != 0;
764 case GLSL_TYPE_FLOAT: return ((int)this->value.f[i]) != 0;
765 case GLSL_TYPE_BOOL: return this->value.b[i];
766 default: assert(!"Should not get here."); break;
769 /* Must return something to make the compiler happy. This is clearly an
776 ir_constant::get_float_component(unsigned i) const
778 switch (this->type->base_type) {
779 case GLSL_TYPE_UINT: return (float) this->value.u[i];
780 case GLSL_TYPE_INT: return (float) this->value.i[i];
781 case GLSL_TYPE_FLOAT: return this->value.f[i];
782 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1.0 : 0.0;
783 default: assert(!"Should not get here."); break;
786 /* Must return something to make the compiler happy. This is clearly an
793 ir_constant::get_int_component(unsigned i) const
795 switch (this->type->base_type) {
796 case GLSL_TYPE_UINT: return this->value.u[i];
797 case GLSL_TYPE_INT: return this->value.i[i];
798 case GLSL_TYPE_FLOAT: return (int) this->value.f[i];
799 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1 : 0;
800 default: assert(!"Should not get here."); break;
803 /* Must return something to make the compiler happy. This is clearly an
810 ir_constant::get_uint_component(unsigned i) const
812 switch (this->type->base_type) {
813 case GLSL_TYPE_UINT: return this->value.u[i];
814 case GLSL_TYPE_INT: return this->value.i[i];
815 case GLSL_TYPE_FLOAT: return (unsigned) this->value.f[i];
816 case GLSL_TYPE_BOOL: return this->value.b[i] ? 1 : 0;
817 default: assert(!"Should not get here."); break;
820 /* Must return something to make the compiler happy. This is clearly an
827 ir_constant::get_array_element(unsigned i) const
829 assert(this->type->is_array());
831 /* From page 35 (page 41 of the PDF) of the GLSL 1.20 spec:
833 * "Behavior is undefined if a shader subscripts an array with an index
834 * less than 0 or greater than or equal to the size the array was
837 * Most out-of-bounds accesses are removed before things could get this far.
838 * There are cases where non-constant array index values can get constant
843 else if (i >= this->type->length)
844 i = this->type->length - 1;
846 return array_elements[i];
850 ir_constant::get_record_field(const char *name)
852 int idx = this->type->field_index(name);
857 if (this->components.is_empty())
860 exec_node *node = this->components.head;
861 for (int i = 0; i < idx; i++) {
864 /* If the end of the list is encountered before the element matching the
865 * requested field is found, return NULL.
867 if (node->is_tail_sentinel())
871 return (ir_constant *) node;
875 ir_constant::copy_offset(ir_constant *src, int offset)
877 switch (this->type->base_type) {
880 case GLSL_TYPE_FLOAT:
881 case GLSL_TYPE_BOOL: {
882 unsigned int size = src->type->components();
883 assert (size <= this->type->components() - offset);
884 for (unsigned int i=0; i<size; i++) {
885 switch (this->type->base_type) {
887 value.u[i+offset] = src->get_uint_component(i);
890 value.i[i+offset] = src->get_int_component(i);
892 case GLSL_TYPE_FLOAT:
893 value.f[i+offset] = src->get_float_component(i);
896 value.b[i+offset] = src->get_bool_component(i);
898 default: // Shut up the compiler
905 case GLSL_TYPE_STRUCT: {
906 assert (src->type == this->type);
907 this->components.make_empty();
908 foreach_list(node, &src->components) {
909 ir_constant *const orig = (ir_constant *) node;
911 this->components.push_tail(orig->clone(this, NULL));
916 case GLSL_TYPE_ARRAY: {
917 assert (src->type == this->type);
918 for (unsigned i = 0; i < this->type->length; i++) {
919 this->array_elements[i] = src->array_elements[i]->clone(this, NULL);
925 assert(!"Should not get here.");
931 ir_constant::copy_masked_offset(ir_constant *src, int offset, unsigned int mask)
933 assert (!type->is_array() && !type->is_record());
935 if (!type->is_vector() && !type->is_matrix()) {
941 for (int i=0; i<4; i++) {
942 if (mask & (1 << i)) {
943 switch (this->type->base_type) {
945 value.u[i+offset] = src->get_uint_component(id++);
948 value.i[i+offset] = src->get_int_component(id++);
950 case GLSL_TYPE_FLOAT:
951 value.f[i+offset] = src->get_float_component(id++);
954 value.b[i+offset] = src->get_bool_component(id++);
957 assert(!"Should not get here.");
965 ir_constant::has_value(const ir_constant *c) const
967 if (this->type != c->type)
970 if (this->type->is_array()) {
971 for (unsigned i = 0; i < this->type->length; i++) {
972 if (!this->array_elements[i]->has_value(c->array_elements[i]))
978 if (this->type->base_type == GLSL_TYPE_STRUCT) {
979 const exec_node *a_node = this->components.head;
980 const exec_node *b_node = c->components.head;
982 while (!a_node->is_tail_sentinel()) {
983 assert(!b_node->is_tail_sentinel());
985 const ir_constant *const a_field = (ir_constant *) a_node;
986 const ir_constant *const b_field = (ir_constant *) b_node;
988 if (!a_field->has_value(b_field))
991 a_node = a_node->next;
992 b_node = b_node->next;
998 for (unsigned i = 0; i < this->type->components(); i++) {
999 switch (this->type->base_type) {
1000 case GLSL_TYPE_UINT:
1001 if (this->value.u[i] != c->value.u[i])
1005 if (this->value.i[i] != c->value.i[i])
1008 case GLSL_TYPE_FLOAT:
1009 if (this->value.f[i] != c->value.f[i])
1012 case GLSL_TYPE_BOOL:
1013 if (this->value.b[i] != c->value.b[i])
1017 assert(!"Should not get here.");
1026 ir_constant::is_zero() const
1028 if (!this->type->is_scalar() && !this->type->is_vector())
1031 for (unsigned c = 0; c < this->type->vector_elements; c++) {
1032 switch (this->type->base_type) {
1033 case GLSL_TYPE_FLOAT:
1034 if (this->value.f[c] != 0.0)
1038 if (this->value.i[c] != 0)
1041 case GLSL_TYPE_UINT:
1042 if (this->value.u[c] != 0)
1045 case GLSL_TYPE_BOOL:
1046 if (this->value.b[c] != false)
1050 /* The only other base types are structures, arrays, and samplers.
1051 * Samplers cannot be constants, and the others should have been
1052 * filtered out above.
1054 assert(!"Should not get here.");
1063 ir_constant::is_one() const
1065 if (!this->type->is_scalar() && !this->type->is_vector())
1068 for (unsigned c = 0; c < this->type->vector_elements; c++) {
1069 switch (this->type->base_type) {
1070 case GLSL_TYPE_FLOAT:
1071 if (this->value.f[c] != 1.0)
1075 if (this->value.i[c] != 1)
1078 case GLSL_TYPE_UINT:
1079 if (this->value.u[c] != 1)
1082 case GLSL_TYPE_BOOL:
1083 if (this->value.b[c] != true)
1087 /* The only other base types are structures, arrays, and samplers.
1088 * Samplers cannot be constants, and the others should have been
1089 * filtered out above.
1091 assert(!"Should not get here.");
1100 ir_constant::is_negative_one() const
1102 if (!this->type->is_scalar() && !this->type->is_vector())
1105 if (this->type->is_boolean())
1108 for (unsigned c = 0; c < this->type->vector_elements; c++) {
1109 switch (this->type->base_type) {
1110 case GLSL_TYPE_FLOAT:
1111 if (this->value.f[c] != -1.0)
1115 if (this->value.i[c] != -1)
1118 case GLSL_TYPE_UINT:
1119 if (int(this->value.u[c]) != -1)
1123 /* The only other base types are structures, arrays, samplers, and
1124 * booleans. Samplers cannot be constants, and the others should
1125 * have been filtered out above.
1127 assert(!"Should not get here.");
1136 ir_constant::is_basis() const
1138 if (!this->type->is_scalar() && !this->type->is_vector())
1141 if (this->type->is_boolean())
1145 for (unsigned c = 0; c < this->type->vector_elements; c++) {
1146 switch (this->type->base_type) {
1147 case GLSL_TYPE_FLOAT:
1148 if (this->value.f[c] == 1.0)
1150 else if (this->value.f[c] != 0.0)
1154 if (this->value.i[c] == 1)
1156 else if (this->value.i[c] != 0)
1159 case GLSL_TYPE_UINT:
1160 if (int(this->value.u[c]) == 1)
1162 else if (int(this->value.u[c]) != 0)
1166 /* The only other base types are structures, arrays, samplers, and
1167 * booleans. Samplers cannot be constants, and the others should
1168 * have been filtered out above.
1170 assert(!"Should not get here.");
1180 this->ir_type = ir_type_loop;
1181 this->cmp = ir_unop_neg;
1184 this->increment = NULL;
1185 this->counter = NULL;
1189 ir_dereference_variable::ir_dereference_variable(ir_variable *var)
1191 assert(var != NULL);
1193 this->ir_type = ir_type_dereference_variable;
1195 this->type = var->type;
1199 ir_dereference_array::ir_dereference_array(ir_rvalue *value,
1200 ir_rvalue *array_index)
1202 this->ir_type = ir_type_dereference_array;
1203 this->array_index = array_index;
1204 this->set_array(value);
1208 ir_dereference_array::ir_dereference_array(ir_variable *var,
1209 ir_rvalue *array_index)
1211 void *ctx = ralloc_parent(var);
1213 this->ir_type = ir_type_dereference_array;
1214 this->array_index = array_index;
1215 this->set_array(new(ctx) ir_dereference_variable(var));
1220 ir_dereference_array::set_array(ir_rvalue *value)
1222 assert(value != NULL);
1224 this->array = value;
1226 const glsl_type *const vt = this->array->type;
1228 if (vt->is_array()) {
1229 type = vt->element_type();
1230 } else if (vt->is_matrix()) {
1231 type = vt->column_type();
1232 } else if (vt->is_vector()) {
1233 type = vt->get_base_type();
1238 ir_dereference_record::ir_dereference_record(ir_rvalue *value,
1241 assert(value != NULL);
1243 this->ir_type = ir_type_dereference_record;
1244 this->record = value;
1245 this->field = ralloc_strdup(this, field);
1246 this->type = this->record->type->field_type(field);
1250 ir_dereference_record::ir_dereference_record(ir_variable *var,
1253 void *ctx = ralloc_parent(var);
1255 this->ir_type = ir_type_dereference_record;
1256 this->record = new(ctx) ir_dereference_variable(var);
1257 this->field = ralloc_strdup(this, field);
1258 this->type = this->record->type->field_type(field);
1262 ir_dereference::is_lvalue() const
1264 ir_variable *var = this->variable_referenced();
1266 /* Every l-value derference chain eventually ends in a variable.
1268 if ((var == NULL) || var->read_only)
1271 /* From page 17 (page 23 of the PDF) of the GLSL 1.20 spec:
1273 * "Samplers cannot be treated as l-values; hence cannot be used
1274 * as out or inout function parameters, nor can they be
1277 if (this->type->contains_sampler())
1284 const char *tex_opcode_strs[] = { "tex", "txb", "txl", "txd", "txf", "txs" };
1286 const char *ir_texture::opcode_string()
1288 assert((unsigned int) op <=
1289 sizeof(tex_opcode_strs) / sizeof(tex_opcode_strs[0]));
1290 return tex_opcode_strs[op];
1294 ir_texture::get_opcode(const char *str)
1296 const int count = sizeof(tex_opcode_strs) / sizeof(tex_opcode_strs[0]);
1297 for (int op = 0; op < count; op++) {
1298 if (strcmp(str, tex_opcode_strs[op]) == 0)
1299 return (ir_texture_opcode) op;
1301 return (ir_texture_opcode) -1;
1306 ir_texture::set_sampler(ir_dereference *sampler, const glsl_type *type)
1308 assert(sampler != NULL);
1309 assert(type != NULL);
1310 this->sampler = sampler;
1313 if (this->op == ir_txs) {
1314 assert(type->base_type == GLSL_TYPE_INT);
1316 assert(sampler->type->sampler_type == (int) type->base_type);
1317 if (sampler->type->sampler_shadow)
1318 assert(type->vector_elements == 4 || type->vector_elements == 1);
1320 assert(type->vector_elements == 4);
1326 ir_swizzle::init_mask(const unsigned *comp, unsigned count)
1328 assert((count >= 1) && (count <= 4));
1330 memset(&this->mask, 0, sizeof(this->mask));
1331 this->mask.num_components = count;
1333 unsigned dup_mask = 0;
1336 assert(comp[3] <= 3);
1337 dup_mask |= (1U << comp[3])
1338 & ((1U << comp[0]) | (1U << comp[1]) | (1U << comp[2]));
1339 this->mask.w = comp[3];
1342 assert(comp[2] <= 3);
1343 dup_mask |= (1U << comp[2])
1344 & ((1U << comp[0]) | (1U << comp[1]));
1345 this->mask.z = comp[2];
1348 assert(comp[1] <= 3);
1349 dup_mask |= (1U << comp[1])
1350 & ((1U << comp[0]));
1351 this->mask.y = comp[1];
1354 assert(comp[0] <= 3);
1355 this->mask.x = comp[0];
1358 this->mask.has_duplicates = dup_mask != 0;
1360 /* Based on the number of elements in the swizzle and the base type
1361 * (i.e., float, int, unsigned, or bool) of the vector being swizzled,
1362 * generate the type of the resulting value.
1364 type = glsl_type::get_instance(val->type->base_type, mask.num_components, 1);
1367 ir_swizzle::ir_swizzle(ir_rvalue *val, unsigned x, unsigned y, unsigned z,
1368 unsigned w, unsigned count)
1371 const unsigned components[4] = { x, y, z, w };
1372 this->ir_type = ir_type_swizzle;
1373 this->init_mask(components, count);
1376 ir_swizzle::ir_swizzle(ir_rvalue *val, const unsigned *comp,
1380 this->ir_type = ir_type_swizzle;
1381 this->init_mask(comp, count);
1384 ir_swizzle::ir_swizzle(ir_rvalue *val, ir_swizzle_mask mask)
1386 this->ir_type = ir_type_swizzle;
1389 this->type = glsl_type::get_instance(val->type->base_type,
1390 mask.num_components, 1);
1399 ir_swizzle::create(ir_rvalue *val, const char *str, unsigned vector_length)
1401 void *ctx = ralloc_parent(val);
1403 /* For each possible swizzle character, this table encodes the value in
1404 * \c idx_map that represents the 0th element of the vector. For invalid
1405 * swizzle characters (e.g., 'k'), a special value is used that will allow
1406 * detection of errors.
1408 static const unsigned char base_idx[26] = {
1409 /* a b c d e f g h i j k l m */
1410 R, R, I, I, I, I, R, I, I, I, I, I, I,
1411 /* n o p q r s t u v w x y z */
1412 I, I, S, S, R, S, S, I, I, X, X, X, X
1415 /* Each valid swizzle character has an entry in the previous table. This
1416 * table encodes the base index encoded in the previous table plus the actual
1417 * index of the swizzle character. When processing swizzles, the first
1418 * character in the string is indexed in the previous table. Each character
1419 * in the string is indexed in this table, and the value found there has the
1420 * value form the first table subtracted. The result must be on the range
1423 * For example, the string "wzyx" will get X from the first table. Each of
1424 * the charcaters will get X+3, X+2, X+1, and X+0 from this table. After
1425 * subtraction, the swizzle values are { 3, 2, 1, 0 }.
1427 * The string "wzrg" will get X from the first table. Each of the characters
1428 * will get X+3, X+2, R+0, and R+1 from this table. After subtraction, the
1429 * swizzle values are { 3, 2, 4, 5 }. Since 4 and 5 are outside the range
1430 * [0,3], the error is detected.
1432 static const unsigned char idx_map[26] = {
1433 /* a b c d e f g h i j k l m */
1434 R+3, R+2, 0, 0, 0, 0, R+1, 0, 0, 0, 0, 0, 0,
1435 /* n o p q r s t u v w x y z */
1436 0, 0, S+2, S+3, R+0, S+0, S+1, 0, 0, X+3, X+0, X+1, X+2
1439 int swiz_idx[4] = { 0, 0, 0, 0 };
1443 /* Validate the first character in the swizzle string and look up the base
1444 * index value as described above.
1446 if ((str[0] < 'a') || (str[0] > 'z'))
1449 const unsigned base = base_idx[str[0] - 'a'];
1452 for (i = 0; (i < 4) && (str[i] != '\0'); i++) {
1453 /* Validate the next character, and, as described above, convert it to a
1456 if ((str[i] < 'a') || (str[i] > 'z'))
1459 swiz_idx[i] = idx_map[str[i] - 'a'] - base;
1460 if ((swiz_idx[i] < 0) || (swiz_idx[i] >= (int) vector_length))
1467 return new(ctx) ir_swizzle(val, swiz_idx[0], swiz_idx[1], swiz_idx[2],
1477 ir_swizzle::variable_referenced() const
1479 return this->val->variable_referenced();
1483 ir_variable::ir_variable(const struct glsl_type *type, const char *name,
1484 ir_variable_mode mode)
1485 : max_array_access(0), read_only(false), centroid(false), invariant(false),
1486 mode(mode), interpolation(INTERP_QUALIFIER_NONE)
1488 this->ir_type = ir_type_variable;
1490 this->name = ralloc_strdup(this, name);
1491 this->explicit_location = false;
1492 this->has_initializer = false;
1493 this->location = -1;
1494 this->uniform_block = -1;
1495 this->warn_extension = NULL;
1496 this->constant_value = NULL;
1497 this->constant_initializer = NULL;
1498 this->origin_upper_left = false;
1499 this->pixel_center_integer = false;
1500 this->depth_layout = ir_depth_layout_none;
1503 if (type && type->base_type == GLSL_TYPE_SAMPLER)
1504 this->read_only = true;
1509 ir_variable::interpolation_string() const
1511 switch (this->interpolation) {
1512 case INTERP_QUALIFIER_NONE: return "no";
1513 case INTERP_QUALIFIER_SMOOTH: return "smooth";
1514 case INTERP_QUALIFIER_FLAT: return "flat";
1515 case INTERP_QUALIFIER_NOPERSPECTIVE: return "noperspective";
1518 assert(!"Should not get here.");
1523 glsl_interp_qualifier
1524 ir_variable::determine_interpolation_mode(bool flat_shade)
1526 if (this->interpolation != INTERP_QUALIFIER_NONE)
1527 return (glsl_interp_qualifier) this->interpolation;
1528 int location = this->location;
1530 location == FRAG_ATTRIB_COL0 || location == FRAG_ATTRIB_COL1;
1531 if (flat_shade && is_gl_Color)
1532 return INTERP_QUALIFIER_FLAT;
1534 return INTERP_QUALIFIER_SMOOTH;
1538 ir_function_signature::ir_function_signature(const glsl_type *return_type)
1539 : return_type(return_type), is_defined(false), _function(NULL)
1541 this->ir_type = ir_type_function_signature;
1542 this->is_builtin = false;
1543 this->origin = NULL;
1548 modes_match(unsigned a, unsigned b)
1553 /* Accept "in" vs. "const in" */
1554 if ((a == ir_var_const_in && b == ir_var_in) ||
1555 (b == ir_var_const_in && a == ir_var_in))
1563 ir_function_signature::qualifiers_match(exec_list *params)
1565 exec_list_iterator iter_a = parameters.iterator();
1566 exec_list_iterator iter_b = params->iterator();
1568 /* check that the qualifiers match. */
1569 while (iter_a.has_next()) {
1570 ir_variable *a = (ir_variable *)iter_a.get();
1571 ir_variable *b = (ir_variable *)iter_b.get();
1573 if (a->read_only != b->read_only ||
1574 !modes_match(a->mode, b->mode) ||
1575 a->interpolation != b->interpolation ||
1576 a->centroid != b->centroid) {
1578 /* parameter a's qualifiers don't match */
1590 ir_function_signature::replace_parameters(exec_list *new_params)
1592 /* Destroy all of the previous parameter information. If the previous
1593 * parameter information comes from the function prototype, it may either
1594 * specify incorrect parameter names or not have names at all.
1596 foreach_iter(exec_list_iterator, iter, parameters) {
1597 assert(((ir_instruction *) iter.get())->as_variable() != NULL);
1602 new_params->move_nodes_to(¶meters);
1606 ir_function::ir_function(const char *name)
1608 this->ir_type = ir_type_function;
1609 this->name = ralloc_strdup(this, name);
1614 ir_function::has_user_signature()
1616 foreach_list(n, &this->signatures) {
1617 ir_function_signature *const sig = (ir_function_signature *) n;
1618 if (!sig->is_builtin)
1626 ir_rvalue::error_value(void *mem_ctx)
1628 ir_rvalue *v = new(mem_ctx) ir_rvalue;
1630 v->type = glsl_type::error_type;
1636 visit_exec_list(exec_list *list, ir_visitor *visitor)
1638 foreach_iter(exec_list_iterator, iter, *list) {
1639 ((ir_instruction *)iter.get())->accept(visitor);
1645 steal_memory(ir_instruction *ir, void *new_ctx)
1647 ir_variable *var = ir->as_variable();
1648 ir_constant *constant = ir->as_constant();
1649 if (var != NULL && var->constant_value != NULL)
1650 steal_memory(var->constant_value, ir);
1652 if (var != NULL && var->constant_initializer != NULL)
1653 steal_memory(var->constant_initializer, ir);
1655 /* The components of aggregate constants are not visited by the normal
1656 * visitor, so steal their values by hand.
1658 if (constant != NULL) {
1659 if (constant->type->is_record()) {
1660 foreach_iter(exec_list_iterator, iter, constant->components) {
1661 ir_constant *field = (ir_constant *)iter.get();
1662 steal_memory(field, ir);
1664 } else if (constant->type->is_array()) {
1665 for (unsigned int i = 0; i < constant->type->length; i++) {
1666 steal_memory(constant->array_elements[i], ir);
1671 ralloc_steal(new_ctx, ir);
1676 reparent_ir(exec_list *list, void *mem_ctx)
1678 foreach_list(node, list) {
1679 visit_tree((ir_instruction *) node, steal_memory, mem_ctx);
1685 try_min_one(ir_rvalue *ir)
1687 ir_expression *expr = ir->as_expression();
1689 if (!expr || expr->operation != ir_binop_min)
1692 if (expr->operands[0]->is_one())
1693 return expr->operands[1];
1695 if (expr->operands[1]->is_one())
1696 return expr->operands[0];
1702 try_max_zero(ir_rvalue *ir)
1704 ir_expression *expr = ir->as_expression();
1706 if (!expr || expr->operation != ir_binop_max)
1709 if (expr->operands[0]->is_zero())
1710 return expr->operands[1];
1712 if (expr->operands[1]->is_zero())
1713 return expr->operands[0];
1719 ir_rvalue::as_rvalue_to_saturate()
1721 ir_expression *expr = this->as_expression();
1726 ir_rvalue *max_zero = try_max_zero(expr);
1728 return try_min_one(max_zero);
1730 ir_rvalue *min_one = try_min_one(expr);
1732 return try_max_zero(min_one);