Tizen 2.1 base
[sdk/emulator/qemu.git] / gl / mesa / src / mesa / drivers / dri / intel / intel_decode.c
1 #include <stdint.h>
2 #include <stdio.h>
3 #include <stdarg.h>
4 #include <string.h>
5
6 #include "intel_decode.h"
7 #include "intel_chipset.h"
8
/* Stream that receives every decoded line and diagnostic in this file. */
static FILE *out;
/* NOTE(review): saved_s2/saved_s4 and their *_set flags are not referenced in
 * the part of the file reviewed here; presumably cached state words - confirm
 * against the later decoders. */
static uint32_t saved_s2 = 0, saved_s4 = 0;
static char saved_s2_set = 0, saved_s4_set = 0;
/* Byte offsets that instr_out() tags as "HEAD" / "TAIL" when a dword's
 * offset equals them. */
static uint32_t head_offset = 0xffffffff; /* undefined */
static uint32_t tail_offset = 0xffffffff; /* undefined */

#ifndef ARRAY_SIZE
/* Number of elements in a true array (not a pointer).  The argument is
 * parenthesized before indexing so expression arguments bind correctly. */
#define ARRAY_SIZE(A) (sizeof(A) / sizeof((A)[0]))
#endif

/*
 * Reports that the buffer ended before the current command did, bumps the
 * failure counter and returns from the *calling* function.
 *
 * The macro relies on two names being in scope at the expansion site:
 * `failures` (int *) and `count` (the value returned).  Both numeric
 * arguments are cast to int because callers pass a mix of int and
 * unsigned int while the format uses %d.
 */
#define BUFFER_FAIL(_count, _len, _name) do {                   \
    fprintf(out, "Buffer size too small in %s (%d < %d)\n",     \
            (_name), (int)(_count), (int)(_len));               \
    (*failures)++;                                              \
    return count;                                               \
} while (0)
25
26
/*
 * Reinterprets the bit pattern of a 32-bit integer as a float.
 * No numeric conversion takes place; the bytes are copied verbatim.
 */
static float
int_as_float(uint32_t intval)
{
    float reinterpreted;

    memcpy(&reinterpreted, &intval, sizeof(reinterpreted));
    return reinterpreted;
}
38
39 static void
40 instr_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
41           char *fmt, ...)
42 {
43     va_list va;
44     char *parseinfo;
45     uint32_t offset = hw_offset + index * 4;
46
47     if (offset == head_offset)
48         parseinfo = "HEAD";
49     else if (offset == tail_offset)
50         parseinfo = "TAIL";
51     else
52         parseinfo = "    ";
53
54     fprintf(out, "0x%08x: %s 0x%08x: %s", offset, parseinfo,
55             data[index],
56             index == 0 ? "" : "   ");
57     va_start(va, fmt);
58     vfprintf(out, fmt, va);
59     va_end(va);
60 }
61
62 static int
63 decode_mi(uint32_t *data, int count, uint32_t hw_offset, int *failures)
64 {
65     unsigned int opcode;
66
67     struct {
68         uint32_t opcode;
69         int len_mask;
70         int min_len;
71         int max_len;
72         char *name;
73     } opcodes_mi[] = {
74         { 0x08, 0, 1, 1, "MI_ARB_ON_OFF" },
75         { 0x0a, 0, 1, 1, "MI_BATCH_BUFFER_END" },
76         { 0x30, 0x3f, 3, 3, "MI_BATCH_BUFFER" },
77         { 0x31, 0x3f, 2, 2, "MI_BATCH_BUFFER_START" },
78         { 0x14, 0x3f, 3, 3, "MI_DISPLAY_BUFFER_INFO" },
79         { 0x04, 0, 1, 1, "MI_FLUSH" },
80         { 0x22, 0x1f, 3, 3, "MI_LOAD_REGISTER_IMM" },
81         { 0x13, 0x3f, 2, 2, "MI_LOAD_SCAN_LINES_EXCL" },
82         { 0x12, 0x3f, 2, 2, "MI_LOAD_SCAN_LINES_INCL" },
83         { 0x00, 0, 1, 1, "MI_NOOP" },
84         { 0x11, 0x3f, 2, 2, "MI_OVERLAY_FLIP" },
85         { 0x07, 0, 1, 1, "MI_REPORT_HEAD" },
86         { 0x18, 0x3f, 2, 2, "MI_SET_CONTEXT" },
87         { 0x20, 0x3f, 3, 4, "MI_STORE_DATA_IMM" },
88         { 0x21, 0x3f, 3, 4, "MI_STORE_DATA_INDEX" },
89         { 0x24, 0x3f, 3, 3, "MI_STORE_REGISTER_MEM" },
90         { 0x02, 0, 1, 1, "MI_USER_INTERRUPT" },
91         { 0x03, 0, 1, 1, "MI_WAIT_FOR_EVENT" },
92         { 0x16, 0x7f, 3, 3, "MI_SEMAPHORE_MBOX" },
93         { 0x26, 0x1f, 3, 4, "MI_FLUSH_DW" },
94         { 0x0b, 0, 1, 1, "MI_SUSPEND_FLUSH" },
95     };
96
97     switch ((data[0] & 0x1f800000) >> 23) {
98     case 0x0a:
99         instr_out(data, hw_offset, 0, "MI_BATCH_BUFFER_END\n");
100         return -1;
101     }
102
103     for (opcode = 0; opcode < sizeof(opcodes_mi) / sizeof(opcodes_mi[0]);
104          opcode++) {
105         if ((data[0] & 0x1f800000) >> 23 == opcodes_mi[opcode].opcode) {
106             unsigned int len = 1, i;
107
108             instr_out(data, hw_offset, 0, "%s\n", opcodes_mi[opcode].name);
109             if (opcodes_mi[opcode].max_len > 1) {
110                 len = (data[0] & opcodes_mi[opcode].len_mask) + 2;
111                 if (len < opcodes_mi[opcode].min_len ||
112                     len > opcodes_mi[opcode].max_len)
113                 {
114                     fprintf(out, "Bad length (%d) in %s, [%d, %d]\n",
115                             len, opcodes_mi[opcode].name,
116                             opcodes_mi[opcode].min_len,
117                             opcodes_mi[opcode].max_len);
118                 }
119             }
120
121             for (i = 1; i < len; i++) {
122                 if (i >= count)
123                     BUFFER_FAIL(count, len, opcodes_mi[opcode].name);
124                 instr_out(data, hw_offset, i, "dword %d\n", i);
125             }
126
127             return len;
128         }
129     }
130
131     instr_out(data, hw_offset, 0, "MI UNKNOWN\n");
132     (*failures)++;
133     return 1;
134 }
135
136 static int
137 decode_2d(uint32_t *data, int count, uint32_t hw_offset, int *failures)
138 {
139     unsigned int opcode, len;
140     char *format = NULL;
141
142     struct {
143         uint32_t opcode;
144         int min_len;
145         int max_len;
146         char *name;
147     } opcodes_2d[] = {
148         { 0x40, 5, 5, "COLOR_BLT" },
149         { 0x43, 6, 6, "SRC_COPY_BLT" },
150         { 0x01, 8, 8, "XY_SETUP_BLT" },
151         { 0x11, 9, 9, "XY_SETUP_MONO_PATTERN_SL_BLT" },
152         { 0x03, 3, 3, "XY_SETUP_CLIP_BLT" },
153         { 0x24, 2, 2, "XY_PIXEL_BLT" },
154         { 0x25, 3, 3, "XY_SCANLINES_BLT" },
155         { 0x26, 4, 4, "Y_TEXT_BLT" },
156         { 0x31, 5, 134, "XY_TEXT_IMMEDIATE_BLT" },
157         { 0x50, 6, 6, "XY_COLOR_BLT" },
158         { 0x51, 6, 6, "XY_PAT_BLT" },
159         { 0x76, 8, 8, "XY_PAT_CHROMA_BLT" },
160         { 0x72, 7, 135, "XY_PAT_BLT_IMMEDIATE" },
161         { 0x77, 9, 137, "XY_PAT_CHROMA_BLT_IMMEDIATE" },
162         { 0x52, 9, 9, "XY_MONO_PAT_BLT" },
163         { 0x59, 7, 7, "XY_MONO_PAT_FIXED_BLT" },
164         { 0x53, 8, 8, "XY_SRC_COPY_BLT" },
165         { 0x54, 8, 8, "XY_MONO_SRC_COPY_BLT" },
166         { 0x71, 9, 137, "XY_MONO_SRC_COPY_IMMEDIATE_BLT" },
167         { 0x55, 9, 9, "XY_FULL_BLT" },
168         { 0x55, 9, 137, "XY_FULL_IMMEDIATE_PATTERN_BLT" },
169         { 0x56, 9, 9, "XY_FULL_MONO_SRC_BLT" },
170         { 0x75, 10, 138, "XY_FULL_MONO_SRC_IMMEDIATE_PATTERN_BLT" },
171         { 0x57, 12, 12, "XY_FULL_MONO_PATTERN_BLT" },
172         { 0x58, 12, 12, "XY_FULL_MONO_PATTERN_MONO_SRC_BLT" },
173     };
174
175     switch ((data[0] & 0x1fc00000) >> 22) {
176     case 0x50:
177         instr_out(data, hw_offset, 0,
178                   "XY_COLOR_BLT (rgb %sabled, alpha %sabled, dst tile %d)\n",
179                   (data[0] & (1 << 20)) ? "en" : "dis",
180                   (data[0] & (1 << 21)) ? "en" : "dis",
181                   (data[0] >> 11) & 1);
182
183         len = (data[0] & 0x000000ff) + 2;
184         if (len != 6)
185             fprintf(out, "Bad count in XY_COLOR_BLT\n");
186         if (count < 6)
187             BUFFER_FAIL(count, len, "XY_COLOR_BLT");
188
189         switch ((data[1] >> 24) & 0x3) {
190         case 0:
191             format="8";
192             break;
193         case 1:
194             format="565";
195             break;
196         case 2:
197             format="1555";
198             break;
199         case 3:
200             format="8888";
201             break;
202         }
203
204         instr_out(data, hw_offset, 1, "format %s, pitch %d, "
205                   "clipping %sabled\n", format,
206                   (short)(data[1] & 0xffff),
207                   data[1] & (1 << 30) ? "en" : "dis");
208         instr_out(data, hw_offset, 2, "(%d,%d)\n",
209                   data[2] & 0xffff, data[2] >> 16);
210         instr_out(data, hw_offset, 3, "(%d,%d)\n",
211                   data[3] & 0xffff, data[3] >> 16);
212         instr_out(data, hw_offset, 4, "offset 0x%08x\n", data[4]);
213         instr_out(data, hw_offset, 5, "color\n");
214         return len;
215     case 0x53:
216         instr_out(data, hw_offset, 0,
217                   "XY_SRC_COPY_BLT (rgb %sabled, alpha %sabled, "
218                   "src tile %d, dst tile %d)\n",
219                   (data[0] & (1 << 20)) ? "en" : "dis",
220                   (data[0] & (1 << 21)) ? "en" : "dis",
221                   (data[0] >> 15) & 1,
222                   (data[0] >> 11) & 1);
223
224         len = (data[0] & 0x000000ff) + 2;
225         if (len != 8)
226             fprintf(out, "Bad count in XY_SRC_COPY_BLT\n");
227         if (count < 8)
228             BUFFER_FAIL(count, len, "XY_SRC_COPY_BLT");
229
230         switch ((data[1] >> 24) & 0x3) {
231         case 0:
232             format="8";
233             break;
234         case 1:
235             format="565";
236             break;
237         case 2:
238             format="1555";
239             break;
240         case 3:
241             format="8888";
242             break;
243         }
244
245         instr_out(data, hw_offset, 1, "format %s, dst pitch %d, "
246                   "clipping %sabled\n", format,
247                   (short)(data[1] & 0xffff),
248                   data[1] & (1 << 30) ? "en" : "dis");
249         instr_out(data, hw_offset, 2, "dst (%d,%d)\n",
250                   data[2] & 0xffff, data[2] >> 16);
251         instr_out(data, hw_offset, 3, "dst (%d,%d)\n",
252                   data[3] & 0xffff, data[3] >> 16);
253         instr_out(data, hw_offset, 4, "dst offset 0x%08x\n", data[4]);
254         instr_out(data, hw_offset, 5, "src (%d,%d)\n",
255                   data[5] & 0xffff, data[5] >> 16);
256         instr_out(data, hw_offset, 6, "src pitch %d\n",
257                   (short)(data[6] & 0xffff));
258         instr_out(data, hw_offset, 7, "src offset 0x%08x\n", data[7]);
259         return len;
260     }
261
262     for (opcode = 0; opcode < sizeof(opcodes_2d) / sizeof(opcodes_2d[0]);
263          opcode++) {
264         if ((data[0] & 0x1fc00000) >> 22 == opcodes_2d[opcode].opcode) {
265             unsigned int i;
266
267             len = 1;
268             instr_out(data, hw_offset, 0, "%s\n", opcodes_2d[opcode].name);
269             if (opcodes_2d[opcode].max_len > 1) {
270                 len = (data[0] & 0x000000ff) + 2;
271                 if (len < opcodes_2d[opcode].min_len ||
272                     len > opcodes_2d[opcode].max_len)
273                 {
274                     fprintf(out, "Bad count in %s\n", opcodes_2d[opcode].name);
275                 }
276             }
277
278             for (i = 1; i < len; i++) {
279                 if (i >= count)
280                     BUFFER_FAIL(count, len, opcodes_2d[opcode].name);
281                 instr_out(data, hw_offset, i, "dword %d\n", i);
282             }
283
284             return len;
285         }
286     }
287
288     instr_out(data, hw_offset, 0, "2D UNKNOWN\n");
289     (*failures)++;
290     return 1;
291 }
292
/*
 * Decodes a single-dword 3D command whose sub-opcode sits in bits 23:19 of
 * data[0].  Always returns 1; an unrecognised sub-opcode is reported and
 * bumps *failures.  `count` is not consulted.
 */
static int
decode_3d_1c(uint32_t *data, int count, uint32_t hw_offset, int *failures)
{
    const uint32_t opcode = (data[0] & 0x00f80000) >> 19;

    if (opcode == 0x11) {
        instr_out(data, hw_offset, 0, "3DSTATE_DEPTH_SUBRECTANGLE_DISABLE\n");
    } else if (opcode == 0x10) {
        /* Bit 0 of the command selects enabled/disabled. */
        instr_out(data, hw_offset, 0, "3DSTATE_SCISSOR_ENABLE %s\n",
                  (data[0] & 1) ? "enabled" : "disabled");
    } else if (opcode == 0x01) {
        instr_out(data, hw_offset, 0, "3DSTATE_MAP_COORD_SET_I830\n");
    } else if (opcode == 0x0a) {
        instr_out(data, hw_offset, 0, "3DSTATE_MAP_CUBE_I830\n");
    } else if (opcode == 0x05) {
        instr_out(data, hw_offset, 0, "3DSTATE_MAP_TEX_STREAM_I830\n");
    } else {
        instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_1c opcode = 0x%x\n",
                  opcode);
        (*failures)++;
    }

    return 1;
}
324
325 /** Sets the string dstname to describe the destination of the PS instruction */
326 static void
327 i915_get_instruction_dst(uint32_t *data, int i, char *dstname, int do_mask)
328 {
329     uint32_t a0 = data[i];
330     int dst_nr = (a0 >> 14) & 0xf;
331     char dstmask[8];
332     char *sat;
333
334     if (do_mask) {
335         if (((a0 >> 10) & 0xf) == 0xf) {
336             dstmask[0] = 0;
337         } else {
338             int dstmask_index = 0;
339
340             dstmask[dstmask_index++] = '.';
341             if (a0 & (1 << 10))
342                 dstmask[dstmask_index++] = 'x';
343             if (a0 & (1 << 11))
344                 dstmask[dstmask_index++] = 'y';
345             if (a0 & (1 << 12))
346                 dstmask[dstmask_index++] = 'z';
347             if (a0 & (1 << 13))
348                 dstmask[dstmask_index++] = 'w';
349             dstmask[dstmask_index++] = 0;
350         }
351
352         if (a0 & (1 << 22))
353             sat = ".sat";
354         else
355             sat = "";
356     } else {
357         dstmask[0] = 0;
358         sat = "";
359     }
360
361     switch ((a0 >> 19) & 0x7) {
362     case 0:
363         if (dst_nr > 15)
364             fprintf(out, "bad destination reg R%d\n", dst_nr);
365         sprintf(dstname, "R%d%s%s", dst_nr, dstmask, sat);
366         break;
367     case 4:
368         if (dst_nr > 0)
369             fprintf(out, "bad destination reg oC%d\n", dst_nr);
370         sprintf(dstname, "oC%s%s", dstmask, sat);
371         break;
372     case 5:
373         if (dst_nr > 0)
374             fprintf(out, "bad destination reg oD%d\n", dst_nr);
375         sprintf(dstname, "oD%s%s",  dstmask, sat);
376         break;
377     case 6:
378         if (dst_nr > 3)
379             fprintf(out, "bad destination reg U%d\n", dst_nr);
380         sprintf(dstname, "U%d%s%s", dst_nr, dstmask, sat);
381         break;
382     default:
383         sprintf(dstname, "RESERVED");
384         break;
385     }
386 }
387
/*
 * Returns the text for one 4-bit channel-select field: the low three bits
 * pick x/y/z/w/0/1 (6 and 7 yield "bad"), and bit 3 adds a leading '-'.
 * The returned pointer refers to static storage.
 */
static char *
i915_get_channel_swizzle(uint32_t select)
{
    static char *const plain[6]   = { "x", "y", "z", "w", "0", "1" };
    static char *const negated[6] = { "-x", "-y", "-z", "-w", "-0", "-1" };
    const uint32_t channel = select & 0x7;
    const int negate = (select & 8) != 0;

    if (channel > 5)
        return negate ? "-bad" : "bad";

    return negate ? negated[channel] : plain[channel];
}
408
409 static void
410 i915_get_instruction_src_name(uint32_t src_type, uint32_t src_nr, char *name)
411 {
412     switch (src_type) {
413     case 0:
414         sprintf(name, "R%d", src_nr);
415         if (src_nr > 15)
416             fprintf(out, "bad src reg %s\n", name);
417         break;
418     case 1:
419         if (src_nr < 8)
420             sprintf(name, "T%d", src_nr);
421         else if (src_nr == 8)
422             sprintf(name, "DIFFUSE");
423         else if (src_nr == 9)
424             sprintf(name, "SPECULAR");
425         else if (src_nr == 10)
426             sprintf(name, "FOG");
427         else {
428             fprintf(out, "bad src reg T%d\n", src_nr);
429             sprintf(name, "RESERVED");
430         }
431         break;
432     case 2:
433         sprintf(name, "C%d", src_nr);
434         if (src_nr > 31)
435             fprintf(out, "bad src reg %s\n", name);
436         break;
437     case 4:
438         sprintf(name, "oC");
439         if (src_nr > 0)
440             fprintf(out, "bad src reg oC%d\n", src_nr);
441         break;
442     case 5:
443         sprintf(name, "oD");
444         if (src_nr > 0)
445             fprintf(out, "bad src reg oD%d\n", src_nr);
446         break;
447     case 6:
448         sprintf(name, "U%d", src_nr);
449         if (src_nr > 3)
450             fprintf(out, "bad src reg %s\n", name);
451         break;
452     default:
453         fprintf(out, "bad src reg type %d\n", src_type);
454         sprintf(name, "RESERVED");
455         break;
456     }
457 }
458
/*
 * Writes the first source operand of the instruction at data[i] into
 * srcname.  Register type and number come from data[i] (bits 9:7 and 6:2);
 * the four channel selects come from the top 16 bits of data[i + 1].  The
 * swizzle suffix is appended only when it differs from ".xyzw".
 */
static void
i915_get_instruction_src0(uint32_t *data, int i, char *srcname)
{
    const uint32_t dw0 = data[i];
    const uint32_t dw1 = data[i + 1];
    const int reg_nr = (dw0 >> 2) & 0x1f;
    char suffix[100];

    i915_get_instruction_src_name((dw0 >> 7) & 0x7, reg_nr, srcname);

    sprintf(suffix, ".%s%s%s%s",
            i915_get_channel_swizzle((dw1 >> 28) & 0xf),
            i915_get_channel_swizzle((dw1 >> 24) & 0xf),
            i915_get_channel_swizzle((dw1 >> 20) & 0xf),
            i915_get_channel_swizzle((dw1 >> 16) & 0xf));

    /* The identity swizzle is left implicit. */
    if (strcmp(suffix, ".xyzw") == 0)
        return;
    strcat(srcname, suffix);
}
476
/*
 * Writes the second source operand of the instruction at data[i] into
 * srcname.  Register type and number come from data[i + 1] (bits 15:13 and
 * 12:8); the x/y selects come from the low byte of data[i + 1] and the z/w
 * selects from the top byte of data[i + 2].  The swizzle suffix is appended
 * only when it differs from ".xyzw".
 */
static void
i915_get_instruction_src1(uint32_t *data, int i, char *srcname)
{
    const uint32_t dw1 = data[i + 1];
    const uint32_t dw2 = data[i + 2];
    const int reg_nr = (dw1 >> 8) & 0x1f;
    char suffix[100];

    i915_get_instruction_src_name((dw1 >> 13) & 0x7, reg_nr, srcname);

    sprintf(suffix, ".%s%s%s%s",
            i915_get_channel_swizzle((dw1 >> 4) & 0xf),
            i915_get_channel_swizzle((dw1 >> 0) & 0xf),
            i915_get_channel_swizzle((dw2 >> 28) & 0xf),
            i915_get_channel_swizzle((dw2 >> 24) & 0xf));

    /* The identity swizzle is left implicit. */
    if (strcmp(suffix, ".xyzw") == 0)
        return;
    strcat(srcname, suffix);
}
494
/*
 * Writes the third source operand of the instruction at data[i] into
 * srcname.  Everything is read from data[i + 2]: register type from bits
 * 23:21, number from bits 20:16, channel selects from the low 16 bits.  The
 * swizzle suffix is appended only when it differs from ".xyzw".
 */
static void
i915_get_instruction_src2(uint32_t *data, int i, char *srcname)
{
    const uint32_t dw2 = data[i + 2];
    const int reg_nr = (dw2 >> 16) & 0x1f;
    char suffix[100];

    i915_get_instruction_src_name((dw2 >> 21) & 0x7, reg_nr, srcname);

    sprintf(suffix, ".%s%s%s%s",
            i915_get_channel_swizzle((dw2 >> 12) & 0xf),
            i915_get_channel_swizzle((dw2 >> 8) & 0xf),
            i915_get_channel_swizzle((dw2 >> 4) & 0xf),
            i915_get_channel_swizzle((dw2 >> 0) & 0xf));

    /* The identity swizzle is left implicit. */
    if (strcmp(suffix, ".xyzw") == 0)
        return;
    strcat(srcname, suffix);
}
511
512 static void
513 i915_get_instruction_addr(uint32_t src_type, uint32_t src_nr, char *name)
514 {
515     switch (src_type) {
516     case 0:
517         sprintf(name, "R%d", src_nr);
518         if (src_nr > 15)
519             fprintf(out, "bad src reg %s\n", name);
520         break;
521     case 1:
522         if (src_nr < 8)
523             sprintf(name, "T%d", src_nr);
524         else if (src_nr == 8)
525             sprintf(name, "DIFFUSE");
526         else if (src_nr == 9)
527             sprintf(name, "SPECULAR");
528         else if (src_nr == 10)
529             sprintf(name, "FOG");
530         else {
531             fprintf(out, "bad src reg T%d\n", src_nr);
532             sprintf(name, "RESERVED");
533         }
534         break;
535     case 4:
536         sprintf(name, "oC");
537         if (src_nr > 0)
538             fprintf(out, "bad src reg oC%d\n", src_nr);
539         break;
540     case 5:
541         sprintf(name, "oD");
542         if (src_nr > 0)
543             fprintf(out, "bad src reg oD%d\n", src_nr);
544         break;
545     default:
546         fprintf(out, "bad src reg type %d\n", src_type);
547         sprintf(name, "RESERVED");
548         break;
549     }
550 }
551
/*
 * Prints a one-source ALU instruction occupying data[i..i+2]: the first
 * dword's line carries "op dst, src0", the other two carry only the prefix.
 */
static void
i915_decode_alu1(uint32_t *data, uint32_t hw_offset,
                 int i, char *instr_prefix, char *op_name)
{
    char dst_text[100];
    char src0_text[100];

    i915_get_instruction_dst(data, i, dst_text, 1);
    i915_get_instruction_src0(data, i, src0_text);

    instr_out(data, hw_offset, i, "%s: %s %s, %s\n", instr_prefix,
              op_name, dst_text, src0_text);
    instr_out(data, hw_offset, i + 1, "%s\n", instr_prefix);
    instr_out(data, hw_offset, i + 2, "%s\n", instr_prefix);
}
566
/*
 * Prints a two-source ALU instruction occupying data[i..i+2]: the first
 * dword's line carries "op dst, src0, src1", the other two carry only the
 * prefix.
 */
static void
i915_decode_alu2(uint32_t *data, uint32_t hw_offset,
                 int i, char *instr_prefix, char *op_name)
{
    char dst_text[100];
    char src0_text[100];
    char src1_text[100];

    i915_get_instruction_dst(data, i, dst_text, 1);
    i915_get_instruction_src0(data, i, src0_text);
    i915_get_instruction_src1(data, i, src1_text);

    instr_out(data, hw_offset, i, "%s: %s %s, %s, %s\n", instr_prefix,
              op_name, dst_text, src0_text, src1_text);
    instr_out(data, hw_offset, i + 1, "%s\n", instr_prefix);
    instr_out(data, hw_offset, i + 2, "%s\n", instr_prefix);
}
582
/*
 * Prints a three-source ALU instruction occupying data[i..i+2]: the first
 * dword's line carries "op dst, src0, src1, src2", the other two carry only
 * the prefix.
 */
static void
i915_decode_alu3(uint32_t *data, uint32_t hw_offset,
                 int i, char *instr_prefix, char *op_name)
{
    char dst_text[100];
    char src0_text[100];
    char src1_text[100];
    char src2_text[100];

    i915_get_instruction_dst(data, i, dst_text, 1);
    i915_get_instruction_src0(data, i, src0_text);
    i915_get_instruction_src1(data, i, src1_text);
    i915_get_instruction_src2(data, i, src2_text);

    instr_out(data, hw_offset, i, "%s: %s %s, %s, %s, %s\n", instr_prefix,
              op_name, dst_text, src0_text, src1_text, src2_text);
    instr_out(data, hw_offset, i + 1, "%s\n", instr_prefix);
    instr_out(data, hw_offset, i + 2, "%s\n", instr_prefix);
}
599
/*
 * Prints a texture instruction occupying data[i..i+2].  The destination is
 * decoded without mask/saturate, the sampler number is the low nibble of
 * data[i], and the address register comes from data[i + 1] (type in bits
 * 26:24, number in bits 20:17).
 */
static void
i915_decode_tex(uint32_t *data, uint32_t hw_offset, int i, char *instr_prefix,
                char *tex_name)
{
    const uint32_t dw0 = data[i];
    const uint32_t dw1 = data[i + 1];
    const int sampler = dw0 & 0xf;
    char dst_text[100];
    char addr_text[100];

    i915_get_instruction_dst(data, i, dst_text, 0);
    i915_get_instruction_addr((dw1 >> 24) & 0x7, (dw1 >> 17) & 0xf, addr_text);

    instr_out(data, hw_offset, i, "%s: %s %s, S%d, %s\n", instr_prefix,
              tex_name, dst_text, sampler, addr_text);
    instr_out(data, hw_offset, i + 1, "%s\n", instr_prefix);
    instr_out(data, hw_offset, i + 2, "%s\n", instr_prefix);
}
621
622 static void
623 i915_decode_dcl(uint32_t *data, uint32_t hw_offset, int i, char *instr_prefix)
624 {
625     uint32_t d0 = data[i];
626     char *sampletype;
627     int dcl_nr = (d0 >> 14) & 0xf;
628     char *dcl_x = d0 & (1 << 10) ? "x" : "";
629     char *dcl_y = d0 & (1 << 11) ? "y" : "";
630     char *dcl_z = d0 & (1 << 12) ? "z" : "";
631     char *dcl_w = d0 & (1 << 13) ? "w" : "";
632     char dcl_mask[10];
633
634     switch ((d0 >> 19) & 0x3) {
635     case 1:
636         sprintf(dcl_mask, ".%s%s%s%s", dcl_x, dcl_y, dcl_z, dcl_w);
637         if (strcmp(dcl_mask, ".") == 0)
638             fprintf(out, "bad (empty) dcl mask\n");
639
640         if (dcl_nr > 10)
641             fprintf(out, "bad T%d dcl register number\n", dcl_nr);
642         if (dcl_nr < 8) {
643             if (strcmp(dcl_mask, ".x") != 0 &&
644                 strcmp(dcl_mask, ".xy") != 0 &&
645                 strcmp(dcl_mask, ".xz") != 0 &&
646                 strcmp(dcl_mask, ".w") != 0 &&
647                 strcmp(dcl_mask, ".xyzw") != 0) {
648                 fprintf(out, "bad T%d.%s dcl mask\n", dcl_nr, dcl_mask);
649             }
650             instr_out(data, hw_offset, i++, "%s: DCL T%d%s\n", instr_prefix,
651                       dcl_nr, dcl_mask);
652         } else {
653             if (strcmp(dcl_mask, ".xz") == 0)
654                 fprintf(out, "errataed bad dcl mask %s\n", dcl_mask);
655             else if (strcmp(dcl_mask, ".xw") == 0)
656                 fprintf(out, "errataed bad dcl mask %s\n", dcl_mask);
657             else if (strcmp(dcl_mask, ".xzw") == 0)
658                 fprintf(out, "errataed bad dcl mask %s\n", dcl_mask);
659
660             if (dcl_nr == 8) {
661                 instr_out(data, hw_offset, i++, "%s: DCL DIFFUSE%s\n", instr_prefix,
662                           dcl_mask);
663             } else if (dcl_nr == 9) {
664                 instr_out(data, hw_offset, i++, "%s: DCL SPECULAR%s\n", instr_prefix,
665                           dcl_mask);
666             } else if (dcl_nr == 10) {
667                 instr_out(data, hw_offset, i++, "%s: DCL FOG%s\n", instr_prefix,
668                           dcl_mask);
669             }
670         }
671         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
672         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
673         break;
674     case 3:
675         switch ((d0 >> 22) & 0x3) {
676         case 0:
677             sampletype = "2D";
678             break;
679         case 1:
680             sampletype = "CUBE";
681             break;
682         case 2:
683             sampletype = "3D";
684             break;
685         default:
686             sampletype = "RESERVED";
687             break;
688         }
689         if (dcl_nr > 15)
690             fprintf(out, "bad S%d dcl register number\n", dcl_nr);
691         instr_out(data, hw_offset, i++, "%s: DCL S%d %s\n", instr_prefix,
692                   dcl_nr, sampletype);
693         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
694         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
695         break;
696     default:
697         instr_out(data, hw_offset, i++, "%s: DCL RESERVED%d\n", instr_prefix, dcl_nr);
698         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
699         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
700     }
701 }
702
/*
 * Prints one three-dword PS instruction starting at data[i].  The opcode is
 * bits 28:24 of data[i]; it selects a NOP line, one of the ALU/texture/DCL
 * decoders, or an "unknown" line.  Three lines are emitted in every case.
 */
static void
i915_decode_instruction(uint32_t *data, uint32_t hw_offset,
                        int i, char *instr_prefix)
{
    enum { OP_UNKNOWN, OP_NOP, OP_ALU1, OP_ALU2, OP_ALU3, OP_TEX, OP_DCL };
    /* Indexed by opcode; opcodes past the end of the table are unknown. */
    static const struct {
        int kind;
        char *name;
    } op_table[] = {
        /* 0x00 */ { OP_NOP,     "NOP" },
        /* 0x01 */ { OP_ALU2,    "ADD" },
        /* 0x02 */ { OP_ALU1,    "MOV" },
        /* 0x03 */ { OP_ALU2,    "MUL" },
        /* 0x04 */ { OP_ALU3,    "MAD" },
        /* 0x05 */ { OP_ALU3,    "DP2ADD" },
        /* 0x06 */ { OP_ALU2,    "DP3" },
        /* 0x07 */ { OP_ALU2,    "DP4" },
        /* 0x08 */ { OP_ALU1,    "FRC" },
        /* 0x09 */ { OP_ALU1,    "RCP" },
        /* 0x0a */ { OP_ALU1,    "RSQ" },
        /* 0x0b */ { OP_ALU1,    "EXP" },
        /* 0x0c */ { OP_ALU1,    "LOG" },
        /* 0x0d */ { OP_ALU2,    "CMP" },
        /* 0x0e */ { OP_ALU2,    "MIN" },
        /* 0x0f */ { OP_ALU2,    "MAX" },
        /* 0x10 */ { OP_ALU1,    "FLR" },
        /* 0x11 */ { OP_ALU1,    "MOD" },
        /* 0x12 */ { OP_ALU1,    "TRC" },
        /* 0x13 */ { OP_ALU2,    "SGE" },
        /* 0x14 */ { OP_ALU2,    "SLT" },
        /* 0x15 */ { OP_TEX,     "TEXLD" },
        /* 0x16 */ { OP_TEX,     "TEXLDP" },
        /* 0x17 */ { OP_TEX,     "TEXLDB" },
        /* 0x18 */ { OP_UNKNOWN, "" },
        /* 0x19 */ { OP_DCL,     "" },
    };
    const uint32_t op = (data[i] >> 24) & 0x1f;
    int kind = OP_UNKNOWN;
    char *mnemonic = "";

    if (op < sizeof(op_table) / sizeof(op_table[0])) {
        kind = op_table[op].kind;
        mnemonic = op_table[op].name;
    }

    if (kind == OP_ALU1) {
        i915_decode_alu1(data, hw_offset, i, instr_prefix, mnemonic);
    } else if (kind == OP_ALU2) {
        i915_decode_alu2(data, hw_offset, i, instr_prefix, mnemonic);
    } else if (kind == OP_ALU3) {
        i915_decode_alu3(data, hw_offset, i, instr_prefix, mnemonic);
    } else if (kind == OP_TEX) {
        i915_decode_tex(data, hw_offset, i, instr_prefix, mnemonic);
    } else if (kind == OP_DCL) {
        i915_decode_dcl(data, hw_offset, i, instr_prefix);
    } else {
        /* NOP and unknown opcodes only differ in the first line's text. */
        if (kind == OP_NOP)
            instr_out(data, hw_offset, i, "%s: NOP\n", instr_prefix);
        else
            instr_out(data, hw_offset, i, "%s: unknown\n", instr_prefix);
        instr_out(data, hw_offset, i + 1, "%s\n", instr_prefix);
        instr_out(data, hw_offset, i + 2, "%s\n", instr_prefix);
    }
}
792
/*
 * Returns the name of a comparison function selected by the low three bits
 * of op.  The returned pointer refers to static storage.
 */
static char *
decode_compare_func(uint32_t op)
{
    static char *const func_names[8] = {
        "always", "never", "less", "equal",
        "lequal", "greater", "notequal", "gequal",
    };

    return func_names[op & 0x7];
}
808
/*
 * Returns the name of a stencil operation selected by the low three bits of
 * op.  The returned pointer refers to static storage.
 *
 * Value 5 used to return "greater", a comparison-function name rather than
 * a stencil operation.  NOTE(review): the 5/6/7 names below follow the
 * STENCILOP_* values in Mesa's i915 register header (INCR = 5, DECR = 6,
 * INVERT = 7) - confirm against that header.
 */
static char *
decode_stencil_op(uint32_t op)
{
    switch (op&0x7) {
    case 0: return "keep";
    case 1: return "zero";
    case 2: return "replace";
    case 3: return "incr_sat";
    case 4: return "decr_sat";
    case 5: return "incr";
    case 6: return "decr";
    case 7: return "invert";
    }
    return "";
}
824
/*
 * Returns the name of a blend factor selected by the low four bits of op.
 * Value 0 has no name and yields an empty string.  The returned pointer
 * refers to static storage.
 */
static char *
decode_blend_fact(uint32_t op)
{
    static char *const factor_names[16] = {
        "",
        "zero",
        "one",
        "src_colr",
        "inv_src_colr",
        "src_alpha",
        "inv_src_alpha",
        "dst_alpha",
        "inv_dst_alpha",
        "dst_colr",
        "inv_dst_colr",
        "src_alpha_sat",
        "cnst_colr",
        "inv_cnst_colr",
        "cnst_alpha",
        "inv_const_alpha",
    };

    return factor_names[op & 0xf];
}
847
/*
 * Returns the name of a texture coordinate mode selected by the low three
 * bits of mode.  Values 6 and 7 have no name and yield an empty string.
 * The returned pointer refers to static storage.
 */
static char *
decode_tex_coord_mode(uint32_t mode)
{
    static char *const mode_names[8] = {
        "wrap", "mirror", "clamp_edge", "cube",
        "clamp_border", "mirror_once", "", "",
    };

    return mode_names[mode & 0x7];
}
861
/*
 * Returns the name of a sampler filter selected by the low three bits of
 * mode.  Value 7 has no name and yields an empty string.  The returned
 * pointer refers to static storage.
 */
static char *
decode_sample_filter(uint32_t mode)
{
    static char *const filter_names[8] = {
        "nearest", "linear", "anisotropic", "4x4_1",
        "4x4_2", "4x4_flat", "6x5_mono", "",
    };

    return filter_names[mode & 0x7];
}
876
877 static int
878 decode_3d_1d(uint32_t *data, int count,
879              uint32_t hw_offset,
880              uint32_t devid,
881              int *failures)
882 {
883     unsigned int len, i, c, idx, word, map, sampler, instr;
884     char *format = "", *zformat, *type;
885     uint32_t opcode;
886
887     struct {
888         uint32_t opcode;
889         int i830_only;
890         int min_len;
891         int max_len;
892         char *name;
893     } opcodes_3d_1d[] = {
894         { 0x86, 0, 4, 4, "3DSTATE_CHROMA_KEY" },
895         { 0x88, 0, 2, 2, "3DSTATE_CONSTANT_BLEND_COLOR" },
896         { 0x99, 0, 2, 2, "3DSTATE_DEFAULT_DIFFUSE" },
897         { 0x9a, 0, 2, 2, "3DSTATE_DEFAULT_SPECULAR" },
898         { 0x98, 0, 2, 2, "3DSTATE_DEFAULT_Z" },
899         { 0x97, 0, 2, 2, "3DSTATE_DEPTH_OFFSET_SCALE" },
900         { 0x9d, 0, 65, 65, "3DSTATE_FILTER_COEFFICIENTS_4X4" },
901         { 0x9e, 0, 4, 4, "3DSTATE_MONO_FILTER" },
902         { 0x89, 0, 4, 4, "3DSTATE_FOG_MODE" },
903         { 0x8f, 0, 2, 16, "3DSTATE_MAP_PALLETE_LOAD_32" },
904         { 0x83, 0, 2, 2, "3DSTATE_SPAN_STIPPLE" },
905         { 0x8c, 1, 2, 2, "3DSTATE_MAP_COORD_TRANSFORM_I830" },
906         { 0x8b, 1, 2, 2, "3DSTATE_MAP_VERTEX_TRANSFORM_I830" },
907         { 0x8d, 1, 3, 3, "3DSTATE_W_STATE_I830" },
908         { 0x01, 1, 2, 2, "3DSTATE_COLOR_FACTOR_I830" },
909         { 0x02, 1, 2, 2, "3DSTATE_MAP_COORD_SETBIND_I830" },
910     }, *opcode_3d_1d;
911
912     opcode = (data[0] & 0x00ff0000) >> 16;
913
914     switch (opcode) {
915     case 0x07:
916         /* This instruction is unusual.  A 0 length means just 1 DWORD instead of
917          * 2.  The 0 length is specified in one place to be unsupported, but
918          * stated to be required in another, and 0 length LOAD_INDIRECTs appear
919          * to cause no harm at least.
920          */
921         instr_out(data, hw_offset, 0, "3DSTATE_LOAD_INDIRECT\n");
922         len = (data[0] & 0x000000ff) + 1;
923         i = 1;
924         if (data[0] & (0x01 << 8)) {
925             if (i + 2 >= count)
926                 BUFFER_FAIL(count, len, "3DSTATE_LOAD_INDIRECT");
927             instr_out(data, hw_offset, i++, "SIS.0\n");
928             instr_out(data, hw_offset, i++, "SIS.1\n");
929         }
930         if (data[0] & (0x02 << 8)) {
931             if (i + 1 >= count)
932                 BUFFER_FAIL(count, len, "3DSTATE_LOAD_INDIRECT");
933             instr_out(data, hw_offset, i++, "DIS.0\n");
934         }
935         if (data[0] & (0x04 << 8)) {
936             if (i + 2 >= count)
937                 BUFFER_FAIL(count, len, "3DSTATE_LOAD_INDIRECT");
938             instr_out(data, hw_offset, i++, "SSB.0\n");
939             instr_out(data, hw_offset, i++, "SSB.1\n");
940         }
941         if (data[0] & (0x08 << 8)) {
942             if (i + 2 >= count)
943                 BUFFER_FAIL(count, len, "3DSTATE_LOAD_INDIRECT");
944             instr_out(data, hw_offset, i++, "MSB.0\n");
945             instr_out(data, hw_offset, i++, "MSB.1\n");
946         }
947         if (data[0] & (0x10 << 8)) {
948             if (i + 2 >= count)
949                 BUFFER_FAIL(count, len, "3DSTATE_LOAD_INDIRECT");
950             instr_out(data, hw_offset, i++, "PSP.0\n");
951             instr_out(data, hw_offset, i++, "PSP.1\n");
952         }
953         if (data[0] & (0x20 << 8)) {
954             if (i + 2 >= count)
955                 BUFFER_FAIL(count, len, "3DSTATE_LOAD_INDIRECT");
956             instr_out(data, hw_offset, i++, "PSC.0\n");
957             instr_out(data, hw_offset, i++, "PSC.1\n");
958         }
959         if (len != i) {
960             fprintf(out, "Bad count in 3DSTATE_LOAD_INDIRECT\n");
961             (*failures)++;
962             return len;
963         }
964         return len;
965     case 0x04:
966         instr_out(data, hw_offset, 0, "3DSTATE_LOAD_STATE_IMMEDIATE_1\n");
967         len = (data[0] & 0x0000000f) + 2;
968         i = 1;
969         for (word = 0; word <= 8; word++) {
970             if (data[0] & (1 << (4 + word))) {
971                 if (i >= count)
972                     BUFFER_FAIL(count, len, "3DSTATE_LOAD_STATE_IMMEDIATE_1");
973
974                 /* save vertex state for decode */
975                 if (!IS_GEN2(devid)) {
976                         if (word == 2) {
977                                 saved_s2_set = 1;
978                                 saved_s2 = data[i];
979                         }
980                         if (word == 4) {
981                                 saved_s4_set = 1;
982                                 saved_s4 = data[i];
983                         }
984
985                         switch (word) {
986                         case 0:
987                                 instr_out(data, hw_offset, i, "S0: vbo offset: 0x%08x%s\n",
988                                           data[i]&(~1),data[i]&1?", auto cache invalidate disabled":"");
989                                 break;
990                         case 1:
991                                 instr_out(data, hw_offset, i, "S1: vertex width: %i, vertex pitch: %i\n",
992                                           (data[i]>>24)&0x3f,(data[i]>>16)&0x3f);
993                                 break;
994                         case 2:
995                                 instr_out(data, hw_offset, i, "S2: texcoord formats: ");
996                                 for (int tex_num = 0; tex_num < 8; tex_num++) {
997                                         switch((data[i]>>tex_num*4)&0xf) {
998                                         case 0: fprintf(out, "%i=2D ", tex_num); break;
999                                         case 1: fprintf(out, "%i=3D ", tex_num); break;
1000                                         case 2: fprintf(out, "%i=4D ", tex_num); break;
1001                                         case 3: fprintf(out, "%i=1D ", tex_num); break;
1002                                         case 4: fprintf(out, "%i=2D_16 ", tex_num); break;
1003                                         case 5: fprintf(out, "%i=4D_16 ", tex_num); break;
1004                                         case 0xf: fprintf(out, "%i=NP ", tex_num); break;
1005                                         }
1006                                 }
1007                                 fprintf(out, "\n");
1008
1009                                 break;
1010                         case 3:
1011                                 instr_out(data, hw_offset, i, "S3: not documented\n", word);
1012                                 break;
1013                         case 4:
1014                                 {
1015                                         char *cullmode = "";
1016                                         char *vfmt_xyzw = "";
1017                                         switch((data[i]>>13)&0x3) {
1018                                         case 0: cullmode = "both"; break;
1019                                         case 1: cullmode = "none"; break;
1020                                         case 2: cullmode = "cw"; break;
1021                                         case 3: cullmode = "ccw"; break;
1022                                         }
1023                                         switch(data[i] & (7<<6 | 1<<2)) {
1024                                         case 1<<6: vfmt_xyzw = "XYZ,"; break;
1025                                         case 2<<6: vfmt_xyzw = "XYZW,"; break;
1026                                         case 3<<6: vfmt_xyzw = "XY,"; break;
1027                                         case 4<<6: vfmt_xyzw = "XYW,"; break;
1028                                         case 1<<6 | 1<<2: vfmt_xyzw = "XYZF,"; break;
1029                                         case 2<<6 | 1<<2: vfmt_xyzw = "XYZWF,"; break;
1030                                         case 3<<6 | 1<<2: vfmt_xyzw = "XYF,"; break;
1031                                         case 4<<6 | 1<<2: vfmt_xyzw = "XYWF,"; break;
1032                                         }
1033                                         instr_out(data, hw_offset, i, "S4: point_width=%i, line_width=%.1f,"
1034                                                   "%s%s%s%s%s cullmode=%s, vfmt=%s%s%s%s%s%s "
1035                                                   "%s%s\n",
1036                                                   (data[i]>>23)&0x1ff,
1037                                                   ((data[i]>>19)&0xf) / 2.0,
1038                                                   data[i]&(0xf<<15)?" flatshade=":"",
1039                                                   data[i]&(1<<18)?"Alpha,":"",
1040                                                   data[i]&(1<<17)?"Fog,":"",
1041                                                   data[i]&(1<<16)?"Specular,":"",
1042                                                   data[i]&(1<<15)?"Color,":"",
1043                                                   cullmode,
1044                                                   data[i]&(1<<12)?"PointWidth,":"",
1045                                                   data[i]&(1<<11)?"SpecFog,":"",
1046                                                   data[i]&(1<<10)?"Color,":"",
1047                                                   data[i]&(1<<9)?"DepthOfs,":"",
1048                                                   vfmt_xyzw,
1049                                                   data[i]&(1<<9)?"FogParam,":"",
1050                                                   data[i]&(1<<5)?"force default diffuse, ":"",
1051                                                   data[i]&(1<<4)?"force default specular, ":"",
1052                                                   data[i]&(1<<3)?"local depth ofs enable, ":"",
1053                                                   data[i]&(1<<1)?"point sprite enable, ":"",
1054                                                   data[i]&(1<<0)?"line AA enable, ":"");
1055                                         break;
1056                                 }
1057                         case 5:
1058                                 {
1059                                         instr_out(data, hw_offset, i, "S5:%s%s%s%s%s"
1060                                                   "%s%s%s%s stencil_ref=0x%x, stencil_test=%s, "
1061                                                   "stencil_fail=%s, stencil_pass_z_fail=%s, "
1062                                                   "stencil_pass_z_pass=%s, %s%s%s%s\n",
1063                                                   data[i]&(0xf<<28)?" write_disable=":"",
1064                                                   data[i]&(1<<31)?"Alpha,":"",
1065                                                   data[i]&(1<<30)?"Red,":"",
1066                                                   data[i]&(1<<29)?"Green,":"",
1067                                                   data[i]&(1<<28)?"Blue,":"",
1068                                                   data[i]&(1<<27)?" force default point size,":"",
1069                                                   data[i]&(1<<26)?" last pixel enable,":"",
1070                                                   data[i]&(1<<25)?" global depth ofs enable,":"",
1071                                                   data[i]&(1<<24)?" fog enable,":"",
1072                                                   (data[i]>>16)&0xff,
1073                                                   decode_compare_func(data[i]>>13),
1074                                                   decode_stencil_op(data[i]>>10),
1075                                                   decode_stencil_op(data[i]>>7),
1076                                                   decode_stencil_op(data[i]>>4),
1077                                                   data[i]&(1<<3)?"stencil write enable, ":"",
1078                                                   data[i]&(1<<2)?"stencil test enable, ":"",
1079                                                   data[i]&(1<<1)?"color dither enable, ":"",
1080                                                   data[i]&(1<<0)?"logicop enable, ":"");
1081                                 }
1082                                 break;
1083                         case 6:
1084                                 instr_out(data, hw_offset, i, "S6: %salpha_test=%s, alpha_ref=0x%x, "
1085                                           "depth_test=%s, %ssrc_blnd_fct=%s, dst_blnd_fct=%s, "
1086                                           "%s%stristrip_provoking_vertex=%i\n",
1087                                           data[i]&(1<<31)?"alpha test enable, ":"",
1088                                           decode_compare_func(data[i]>>28),
1089                                           data[i]&(0xff<<20),
1090                                           decode_compare_func(data[i]>>16),
1091                                           data[i]&(1<<15)?"cbuf blend enable, ":"",
1092                                           decode_blend_fact(data[i]>>8),
1093                                           decode_blend_fact(data[i]>>4),
1094                                           data[i]&(1<<3)?"depth write enable, ":"",
1095                                           data[i]&(1<<2)?"cbuf write enable, ":"",
1096                                           data[i]&(0x3));
1097                                 break;
1098                         case 7:
1099                                 instr_out(data, hw_offset, i, "S7: depth offset constant: 0x%08x\n", data[i]);
1100                                 break;
1101                         }
1102                 } else {
1103                         instr_out(data, hw_offset, i, "S%d: 0x%08x\n", i, data[i]);
1104                 }
1105                 i++;
1106             }
1107         }
1108         if (len != i) {
1109             fprintf(out, "Bad count in 3DSTATE_LOAD_STATE_IMMEDIATE_1\n");
1110             (*failures)++;
1111         }
1112         return len;
1113     case 0x03:
1114         instr_out(data, hw_offset, 0, "3DSTATE_LOAD_STATE_IMMEDIATE_2\n");
1115         len = (data[0] & 0x0000000f) + 2;
1116         i = 1;
1117         for (word = 6; word <= 14; word++) {
1118             if (data[0] & (1 << word)) {
1119                 if (i >= count)
1120                     BUFFER_FAIL(count, len, "3DSTATE_LOAD_STATE_IMMEDIATE_2");
1121
1122                 if (word == 6)
1123                     instr_out(data, hw_offset, i++, "TBCF\n");
1124                 else if (word >= 7 && word <= 10) {
1125                     instr_out(data, hw_offset, i++, "TB%dC\n", word - 7);
1126                     instr_out(data, hw_offset, i++, "TB%dA\n", word - 7);
1127                 } else if (word >= 11 && word <= 14) {
1128                     instr_out(data, hw_offset, i, "TM%dS0: offset=0x%08x, %s\n",
1129                               word - 11,
1130                               data[i]&0xfffffffe,
1131                               data[i]&1?"use fence":"");
1132                     i++;
1133                     instr_out(data, hw_offset, i, "TM%dS1: height=%i, width=%i, %s\n",
1134                               word - 11,
1135                               data[i]>>21, (data[i]>>10)&0x3ff,
1136                               data[i]&2?(data[i]&1?"y-tiled":"x-tiled"):"");
1137                     i++;
1138                     instr_out(data, hw_offset, i, "TM%dS2: pitch=%i, \n",
1139                               word - 11,
1140                               ((data[i]>>21) + 1)*4);
1141                     i++;
1142                     instr_out(data, hw_offset, i++, "TM%dS3\n", word - 11);
1143                     instr_out(data, hw_offset, i++, "TM%dS4: dflt color\n", word - 11);
1144                 }
1145             }
1146         }
1147         if (len != i) {
1148             fprintf(out, "Bad count in 3DSTATE_LOAD_STATE_IMMEDIATE_2\n");
1149             (*failures)++;
1150         }
1151         return len;
1152     case 0x00:
1153         instr_out(data, hw_offset, 0, "3DSTATE_MAP_STATE\n");
1154         len = (data[0] & 0x0000003f) + 2;
1155         instr_out(data, hw_offset, 1, "mask\n");
1156
1157         i = 2;
1158         for (map = 0; map <= 15; map++) {
1159             if (data[1] & (1 << map)) {
1160                 int width, height, pitch, dword;
1161                 const char *tiling;
1162
1163                 if (i + 3 >= count)
1164                     BUFFER_FAIL(count, len, "3DSTATE_MAP_STATE");
1165
1166                 dword = data[i];
1167                 instr_out(data, hw_offset, i++, "map %d MS2 %s%s%s\n", map,
1168                           dword&(1<<31)?"untrusted surface, ":"",
1169                           dword&(1<<1)?"vertical line stride enable, ":"",
1170                           dword&(1<<0)?"vertical ofs enable, ":"");
1171
1172                 dword = data[i];
1173                 width = ((dword >> 10) & ((1 << 11) - 1))+1;
1174                 height = ((dword >> 21) & ((1 << 11) - 1))+1;
1175
1176                 tiling = "none";
1177                 if (dword & (1 << 2))
1178                         tiling = "fenced";
1179                 else if (dword & (1 << 1))
1180                         tiling = dword & (1 << 0) ? "Y" : "X";
1181                 type = " BAD";
1182                 switch ((dword>>7) & 0x7) {
1183                 case 1:
1184                     type = "8b";
1185                     switch ((dword>>3) & 0xf) {
1186                     case 0: format = "I"; break;
1187                     case 1: format = "L"; break;
1188                     case 2: format = "A"; break;
1189                     case 3: format = " mono"; break; }
1190                     break;
1191                 case 2:
1192                     type = "16b";
1193                     switch ((dword>>3) & 0xf) {
1194                     case 0: format = " rgb565"; break;
1195                     case 1: format = " argb1555"; break;
1196                     case 2: format = " argb4444"; break;
1197                     case 5: format = " ay88"; break;
1198                     case 6: format = " bump655"; break;
1199                     case 7: format = "I"; break;
1200                     case 8: format = "L"; break;
1201                     case 9: format = "A"; break; }
1202                     break;
1203                 case 3:
1204                     type = "32b";
1205                     switch ((dword>>3) & 0xf) {
1206                     case 0: format = " argb8888"; break;
1207                     case 1: format = " abgr8888"; break;
1208                     case 2: format = " xrgb8888"; break;
1209                     case 3: format = " xbgr8888"; break;
1210                     case 4: format = " qwvu8888"; break;
1211                     case 5: format = " axvu8888"; break;
1212                     case 6: format = " lxvu8888"; break;
1213                     case 7: format = " xlvu8888"; break;
1214                     case 8: format = " argb2101010"; break;
1215                     case 9: format = " abgr2101010"; break;
1216                     case 10: format = " awvu2101010"; break;
1217                     case 11: format = " gr1616"; break;
1218                     case 12: format = " vu1616"; break;
1219                     case 13: format = " xI824"; break;
1220                     case 14: format = " xA824"; break;
1221                     case 15: format = " xL824"; break; }
1222                     break;
1223                 case 5:
1224                     type = "422";
1225                     switch ((dword>>3) & 0xf) {
1226                     case 0: format = " yuv_swapy"; break;
1227                     case 1: format = " yuv"; break;
1228                     case 2: format = " yuv_swapuv"; break;
1229                     case 3: format = " yuv_swapuvy"; break; }
1230                     break;
1231                 case 6:
1232                     type = "compressed";
1233                     switch ((dword>>3) & 0x7) {
1234                     case 0: format = " dxt1"; break;
1235                     case 1: format = " dxt2_3"; break;
1236                     case 2: format = " dxt4_5"; break;
1237                     case 3: format = " fxt1"; break;
1238                     case 4: format = " dxt1_rb"; break; }
1239                     break;
1240                 case 7:
1241                     type = "4b indexed";
1242                     switch ((dword>>3) & 0xf) {
1243                     case 7: format = " argb8888"; break; }
1244                     break;
1245                 default:
1246                     format = "BAD";
1247                 }
1248                 dword = data[i];
1249                 instr_out(data, hw_offset, i++, "map %d MS3 [width=%d, height=%d, format=%s%s, tiling=%s%s]\n",
1250                           map, width, height, type, format, tiling,
1251                           dword&(1<<9)?" palette select":"");
1252
1253                 dword = data[i];
1254                 pitch = 4*(((dword >> 21) & ((1 << 11) - 1))+1);
1255                 instr_out(data, hw_offset, i++, "map %d MS4 [pitch=%d, max_lod=%i, vol_depth=%i, cube_face_ena=%x, %s]\n",
1256                           map, pitch,
1257                           (dword>>9)&0x3f, dword&0xff, (dword>>15)&0x3f,
1258                           dword&(1<<8)?"miplayout legacy":"miplayout right");
1259             }
1260         }
1261         if (len != i) {
1262             fprintf(out, "Bad count in 3DSTATE_MAP_STATE\n");
1263             (*failures)++;
1264             return len;
1265         }
1266         return len;
1267     case 0x06:
1268         instr_out(data, hw_offset, 0, "3DSTATE_PIXEL_SHADER_CONSTANTS\n");
1269         len = (data[0] & 0x000000ff) + 2;
1270
1271         i = 2;
1272         for (c = 0; c <= 31; c++) {
1273             if (data[1] & (1 << c)) {
1274                 if (i + 4 >= count)
1275                     BUFFER_FAIL(count, len, "3DSTATE_PIXEL_SHADER_CONSTANTS");
1276                 instr_out(data, hw_offset, i, "C%d.X = %f\n",
1277                           c, int_as_float(data[i]));
1278                 i++;
1279                 instr_out(data, hw_offset, i, "C%d.Y = %f\n",
1280                           c, int_as_float(data[i]));
1281                 i++;
1282                 instr_out(data, hw_offset, i, "C%d.Z = %f\n",
1283                           c, int_as_float(data[i]));
1284                 i++;
1285                 instr_out(data, hw_offset, i, "C%d.W = %f\n",
1286                           c, int_as_float(data[i]));
1287                 i++;
1288             }
1289         }
1290         if (len != i) {
1291             fprintf(out, "Bad count in 3DSTATE_PIXEL_SHADER_CONSTANTS\n");
1292             (*failures)++;
1293         }
1294         return len;
1295     case 0x05:
1296         instr_out(data, hw_offset, 0, "3DSTATE_PIXEL_SHADER_PROGRAM\n");
1297         len = (data[0] & 0x000000ff) + 2;
1298         if ((len - 1) % 3 != 0 || len > 370) {
1299             fprintf(out, "Bad count in 3DSTATE_PIXEL_SHADER_PROGRAM\n");
1300             (*failures)++;
1301         }
1302         i = 1;
1303         for (instr = 0; instr < (len - 1) / 3; instr++) {
1304             char instr_prefix[10];
1305
1306             if (i + 3 >= count)
1307                 BUFFER_FAIL(count, len, "3DSTATE_PIXEL_SHADER_PROGRAM");
1308             sprintf(instr_prefix, "PS%03d", instr);
1309             i915_decode_instruction(data, hw_offset, i, instr_prefix);
1310             i += 3;
1311         }
1312         return len;
1313     case 0x01:
1314         if (IS_GEN2(devid))
1315                 break;
1316         instr_out(data, hw_offset, 0, "3DSTATE_SAMPLER_STATE\n");
1317         instr_out(data, hw_offset, 1, "mask\n");
1318         len = (data[0] & 0x0000003f) + 2;
1319         i = 2;
1320         for (sampler = 0; sampler <= 15; sampler++) {
1321             if (data[1] & (1 << sampler)) {
1322                 uint32_t dword;
1323                 char *mip_filter = "";
1324                 if (i + 3 >= count)
1325                     BUFFER_FAIL(count, len, "3DSTATE_SAMPLER_STATE");
1326                 dword = data[i];
1327                 switch ((dword>>20)&0x3) {
1328                 case 0: mip_filter = "none"; break;
1329                 case 1: mip_filter = "nearest"; break;
1330                 case 3: mip_filter = "linear"; break;
1331                 }
1332                 instr_out(data, hw_offset, i++, "sampler %d SS2:%s%s%s "
1333                           "base_mip_level=%i, mip_filter=%s, mag_filter=%s, min_filter=%s "
1334                           "lod_bias=%.2f,%s max_aniso=%i, shadow_func=%s\n", sampler,
1335                           dword&(1<<31)?" reverse gamma,":"",
1336                           dword&(1<<30)?" packed2planar,":"",
1337                           dword&(1<<29)?" colorspace conversion,":"",
1338                           (dword>>22)&0x1f,
1339                           mip_filter,
1340                           decode_sample_filter(dword>>17),
1341                           decode_sample_filter(dword>>14),
1342                           ((dword>>5)&0x1ff)/(0x10*1.0),
1343                           dword&(1<<4)?" shadow,":"",
1344                           dword&(1<<3)?4:2,
1345                           decode_compare_func(dword));
1346                 dword = data[i];
1347                 instr_out(data, hw_offset, i++, "sampler %d SS3: min_lod=%.2f,%s "
1348                           "tcmode_x=%s, tcmode_y=%s, tcmode_z=%s,%s texmap_idx=%i,%s\n",
1349                           sampler, ((dword>>24)&0xff)/(0x10*1.0),
1350                           dword&(1<<17)?" kill pixel enable,":"",
1351                           decode_tex_coord_mode(dword>>12),
1352                           decode_tex_coord_mode(dword>>9),
1353                           decode_tex_coord_mode(dword>>6),
1354                           dword&(1<<5)?" normalized coords,":"",
1355                           (dword>>1)&0xf,
1356                           dword&(1<<0)?" deinterlacer,":"");
1357                 dword = data[i];
1358                 instr_out(data, hw_offset, i++, "sampler %d SS4: border color\n",
1359                           sampler, ((dword>>24)&0xff)/(0x10*1.0),
1360                           dword);
1361             }
1362         }
1363         if (len != i) {
1364             fprintf(out, "Bad count in 3DSTATE_SAMPLER_STATE\n");
1365             (*failures)++;
1366         }
1367         return len;
1368     case 0x85:
1369         len = (data[0] & 0x0000000f) + 2;
1370
1371         if (len != 2)
1372             fprintf(out, "Bad count in 3DSTATE_DEST_BUFFER_VARIABLES\n");
1373         if (count < 2)
1374             BUFFER_FAIL(count, len, "3DSTATE_DEST_BUFFER_VARIABLES");
1375
1376         instr_out(data, hw_offset, 0,
1377                   "3DSTATE_DEST_BUFFER_VARIABLES\n");
1378
1379         switch ((data[1] >> 8) & 0xf) {
1380         case 0x0: format = "g8"; break;
1381         case 0x1: format = "x1r5g5b5"; break;
1382         case 0x2: format = "r5g6b5"; break;
1383         case 0x3: format = "a8r8g8b8"; break;
1384         case 0x4: format = "ycrcb_swapy"; break;
1385         case 0x5: format = "ycrcb_normal"; break;
1386         case 0x6: format = "ycrcb_swapuv"; break;
1387         case 0x7: format = "ycrcb_swapuvy"; break;
1388         case 0x8: format = "a4r4g4b4"; break;
1389         case 0x9: format = "a1r5g5b5"; break;
1390         case 0xa: format = "a2r10g10b10"; break;
1391         default: format = "BAD"; break;
1392         }
1393         switch ((data[1] >> 2) & 0x3) {
1394         case 0x0: zformat = "u16"; break;
1395         case 0x1: zformat = "f16"; break;
1396         case 0x2: zformat = "u24x8"; break;
1397         default: zformat = "BAD"; break;
1398         }
1399         instr_out(data, hw_offset, 1, "%s format, %s depth format, early Z %sabled\n",
1400                   format, zformat,
1401                   (data[1] & (1 << 31)) ? "en" : "dis");
1402         return len;
1403
1404     case 0x8e:
1405         {
1406             const char *name, *tiling;
1407
1408             len = (data[0] & 0x0000000f) + 2;
1409             if (len != 3)
1410                 fprintf(out, "Bad count in 3DSTATE_BUFFER_INFO\n");
1411             if (count < 3)
1412                 BUFFER_FAIL(count, len, "3DSTATE_BUFFER_INFO");
1413
1414             switch((data[1] >> 24) & 0x7) {
1415             case 0x3: name = "color"; break;
1416             case 0x7: name = "depth"; break;
1417             default: name = "unknown"; break;
1418             }
1419
1420             tiling = "none";
1421             if (data[1] & (1 << 23))
1422                 tiling = "fenced";
1423             else if (data[1] & (1 << 22))
1424                 tiling = data[1] & (1 << 21) ? "Y" : "X";
1425
1426             instr_out(data, hw_offset, 0, "3DSTATE_BUFFER_INFO\n");
1427             instr_out(data, hw_offset, 1, "%s, tiling = %s, pitch=%d\n", name, tiling, data[1]&0xffff);
1428
1429             instr_out(data, hw_offset, 2, "address\n");
1430             return len;
1431         }
1432     case 0x81:
1433         len = (data[0] & 0x0000000f) + 2;
1434
1435         if (len != 3)
1436             fprintf(out, "Bad count in 3DSTATE_SCISSOR_RECTANGLE\n");
1437         if (count < 3)
1438             BUFFER_FAIL(count, len, "3DSTATE_SCISSOR_RECTANGLE");
1439
1440         instr_out(data, hw_offset, 0,
1441                   "3DSTATE_SCISSOR_RECTANGLE\n");
1442         instr_out(data, hw_offset, 1, "(%d,%d)\n",
1443                   data[1] & 0xffff, data[1] >> 16);
1444         instr_out(data, hw_offset, 2, "(%d,%d)\n",
1445                   data[2] & 0xffff, data[2] >> 16);
1446
1447         return len;
1448     case 0x80:
1449         len = (data[0] & 0x0000000f) + 2;
1450
1451         if (len != 5)
1452             fprintf(out, "Bad count in 3DSTATE_DRAWING_RECTANGLE\n");
1453         if (count < 5)
1454             BUFFER_FAIL(count, len, "3DSTATE_DRAWING_RECTANGLE");
1455
1456         instr_out(data, hw_offset, 0,
1457                   "3DSTATE_DRAWING_RECTANGLE\n");
1458         instr_out(data, hw_offset, 1, "%s\n",
1459                   data[1]&(1<<30)?"depth ofs disabled ":"");
1460         instr_out(data, hw_offset, 2, "(%d,%d)\n",
1461                   data[2] & 0xffff, data[2] >> 16);
1462         instr_out(data, hw_offset, 3, "(%d,%d)\n",
1463                   data[3] & 0xffff, data[3] >> 16);
1464         instr_out(data, hw_offset, 4, "(%d,%d)\n",
1465                   data[4] & 0xffff, data[4] >> 16);
1466
1467         return len;
1468     case 0x9c:
1469         len = (data[0] & 0x0000000f) + 2;
1470
1471         if (len != 7)
1472             fprintf(out, "Bad count in 3DSTATE_CLEAR_PARAMETERS\n");
1473         if (count < 7)
1474             BUFFER_FAIL(count, len, "3DSTATE_CLEAR_PARAMETERS");
1475
1476         instr_out(data, hw_offset, 0,
1477                   "3DSTATE_CLEAR_PARAMETERS\n");
1478         instr_out(data, hw_offset, 1, "prim_type=%s, clear=%s%s%s\n",
1479                   data[1]&(1<<16)?"CLEAR_RECT":"ZONE_INIT",
1480                   data[1]&(1<<2)?"color,":"",
1481                   data[1]&(1<<1)?"depth,":"",
1482                   data[1]&(1<<0)?"stencil,":"");
1483         instr_out(data, hw_offset, 2, "clear color\n");
1484         instr_out(data, hw_offset, 3, "clear depth/stencil\n");
1485         instr_out(data, hw_offset, 4, "color value (rgba8888)\n");
1486         instr_out(data, hw_offset, 5, "depth value %f\n",
1487                   int_as_float(data[5]));
1488         instr_out(data, hw_offset, 6, "clear stencil\n");
1489         return len;
1490     }
1491
1492     for (idx = 0; idx < ARRAY_SIZE(opcodes_3d_1d); idx++)
1493     {
1494         opcode_3d_1d = &opcodes_3d_1d[idx];
1495         if (opcode_3d_1d->i830_only && !IS_GEN2(devid))
1496             continue;
1497
1498         if (((data[0] & 0x00ff0000) >> 16) == opcode_3d_1d->opcode) {
1499             len = 1;
1500
1501             instr_out(data, hw_offset, 0, "%s\n", opcode_3d_1d->name);
1502             if (opcode_3d_1d->max_len > 1) {
1503                 len = (data[0] & 0x0000ffff) + 2;
1504                 if (len < opcode_3d_1d->min_len ||
1505                     len > opcode_3d_1d->max_len)
1506                 {
1507                     fprintf(out, "Bad count in %s\n",
1508                             opcode_3d_1d->name);
1509                     (*failures)++;
1510                 }
1511             }
1512
1513             for (i = 1; i < len; i++) {
1514                 if (i >= count)
1515                     BUFFER_FAIL(count, len,  opcode_3d_1d->name);
1516                 instr_out(data, hw_offset, i, "dword %d\n", i);
1517             }
1518
1519             return len;
1520         }
1521     }
1522
1523     instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_1d opcode = 0x%x\n", opcode);
1524     (*failures)++;
1525     return 1;
1526 }
1527
1528 static int
1529 decode_3d_primitive(uint32_t *data, int count, uint32_t hw_offset,
1530                     int *failures)
1531 {
1532     char immediate = (data[0] & (1 << 23)) == 0;
1533     unsigned int len, i, j, ret;
1534     char *primtype;
1535     int original_s2 = saved_s2;
1536     int original_s4 = saved_s4;
1537
1538     switch ((data[0] >> 18) & 0xf) {
1539     case 0x0: primtype = "TRILIST"; break;
1540     case 0x1: primtype = "TRISTRIP"; break;
1541     case 0x2: primtype = "TRISTRIP_REVERSE"; break;
1542     case 0x3: primtype = "TRIFAN"; break;
1543     case 0x4: primtype = "POLYGON"; break;
1544     case 0x5: primtype = "LINELIST"; break;
1545     case 0x6: primtype = "LINESTRIP"; break;
1546     case 0x7: primtype = "RECTLIST"; break;
1547     case 0x8: primtype = "POINTLIST"; break;
1548     case 0x9: primtype = "DIB"; break;
1549     case 0xa: primtype = "CLEAR_RECT"; saved_s4 = 3 << 6; saved_s2 = ~0; break;
1550     default: primtype = "unknown"; break;
1551     }
1552
1553     /* XXX: 3DPRIM_DIB not supported */
1554     if (immediate) {
1555         len = (data[0] & 0x0003ffff) + 2;
1556         instr_out(data, hw_offset, 0, "3DPRIMITIVE inline %s\n", primtype);
1557         if (count < len)
1558             BUFFER_FAIL(count, len,  "3DPRIMITIVE inline");
1559         if (!saved_s2_set || !saved_s4_set) {
1560             fprintf(out, "unknown vertex format\n");
1561             for (i = 1; i < len; i++) {
1562                 instr_out(data, hw_offset, i,
1563                           "           vertex data (%f float)\n",
1564                           int_as_float(data[i]));
1565             }
1566         } else {
1567             unsigned int vertex = 0;
1568             for (i = 1; i < len;) {
1569                 unsigned int tc;
1570
1571 #define VERTEX_OUT(fmt, ...) do {                                       \
1572     if (i < len)                                                        \
1573         instr_out(data, hw_offset, i, " V%d."fmt"\n", vertex, __VA_ARGS__); \
1574     else                                                                \
1575         fprintf(out, " missing data in V%d\n", vertex);                 \
1576     i++;                                                                \
1577 } while (0)
1578
1579                 VERTEX_OUT("X = %f", int_as_float(data[i]));
1580                 VERTEX_OUT("Y = %f", int_as_float(data[i]));
1581                 switch (saved_s4 >> 6 & 0x7) {
1582                 case 0x1:
1583                     VERTEX_OUT("Z = %f", int_as_float(data[i]));
1584                     break;
1585                 case 0x2:
1586                     VERTEX_OUT("Z = %f", int_as_float(data[i]));
1587                     VERTEX_OUT("W = %f", int_as_float(data[i]));
1588                     break;
1589                 case 0x3:
1590                     break;
1591                 case 0x4:
1592                     VERTEX_OUT("W = %f", int_as_float(data[i]));
1593                     break;
1594                 default:
1595                     fprintf(out, "bad S4 position mask\n");
1596                 }
1597
1598                 if (saved_s4 & (1 << 10)) {
1599                     VERTEX_OUT("color = (A=0x%02x, R=0x%02x, G=0x%02x, "
1600                                "B=0x%02x)",
1601                                data[i] >> 24,
1602                                (data[i] >> 16) & 0xff,
1603                                (data[i] >> 8) & 0xff,
1604                                data[i] & 0xff);
1605                 }
1606                 if (saved_s4 & (1 << 11)) {
1607                     VERTEX_OUT("spec = (A=0x%02x, R=0x%02x, G=0x%02x, "
1608                                "B=0x%02x)",
1609                                data[i] >> 24,
1610                                (data[i] >> 16) & 0xff,
1611                                (data[i] >> 8) & 0xff,
1612                                data[i] & 0xff);
1613                 }
1614                 if (saved_s4 & (1 << 12))
1615                     VERTEX_OUT("width = 0x%08x)", data[i]);
1616
1617                 for (tc = 0; tc <= 7; tc++) {
1618                     switch ((saved_s2 >> (tc * 4)) & 0xf) {
1619                     case 0x0:
1620                         VERTEX_OUT("T%d.X = %f", tc, int_as_float(data[i]));
1621                         VERTEX_OUT("T%d.Y = %f", tc, int_as_float(data[i]));
1622                         break;
1623                     case 0x1:
1624                         VERTEX_OUT("T%d.X = %f", tc, int_as_float(data[i]));
1625                         VERTEX_OUT("T%d.Y = %f", tc, int_as_float(data[i]));
1626                         VERTEX_OUT("T%d.Z = %f", tc, int_as_float(data[i]));
1627                         break;
1628                     case 0x2:
1629                         VERTEX_OUT("T%d.X = %f", tc, int_as_float(data[i]));
1630                         VERTEX_OUT("T%d.Y = %f", tc, int_as_float(data[i]));
1631                         VERTEX_OUT("T%d.Z = %f", tc, int_as_float(data[i]));
1632                         VERTEX_OUT("T%d.W = %f", tc, int_as_float(data[i]));
1633                         break;
1634                     case 0x3:
1635                         VERTEX_OUT("T%d.X = %f", tc, int_as_float(data[i]));
1636                         break;
1637                     case 0x4:
1638                         VERTEX_OUT("T%d.XY = 0x%08x half-float", tc, data[i]);
1639                         break;
1640                     case 0x5:
1641                         VERTEX_OUT("T%d.XY = 0x%08x half-float", tc, data[i]);
1642                         VERTEX_OUT("T%d.ZW = 0x%08x half-float", tc, data[i]);
1643                         break;
1644                     case 0xf:
1645                         break;
1646                     default:
1647                         fprintf(out, "bad S2.T%d format\n", tc);
1648                     }
1649                 }
1650                 vertex++;
1651             }
1652         }
1653
1654         ret = len;
1655     } else {
1656         /* indirect vertices */
1657         len = data[0] & 0x0000ffff; /* index count */
1658         if (data[0] & (1 << 17)) {
1659             /* random vertex access */
1660             if (count < (len + 1) / 2 + 1) {
1661                 BUFFER_FAIL(count, (len + 1) / 2 + 1,
1662                             "3DPRIMITIVE random indirect");
1663             }
1664             instr_out(data, hw_offset, 0,
1665                       "3DPRIMITIVE random indirect %s (%d)\n", primtype, len);
1666             if (len == 0) {
1667                 /* vertex indices continue until 0xffff is found */
1668                 for (i = 1; i < count; i++) {
1669                     if ((data[i] & 0xffff) == 0xffff) {
1670                         instr_out(data, hw_offset, i,
1671                                   "    indices: (terminator)\n");
1672                         ret = i;
1673                         goto out;
1674                     } else if ((data[i] >> 16) == 0xffff) {
1675                         instr_out(data, hw_offset, i,
1676                                   "    indices: 0x%04x, (terminator)\n",
1677                                   data[i] & 0xffff);
1678                         ret = i;
1679                         goto out;
1680                     } else {
1681                         instr_out(data, hw_offset, i,
1682                                   "    indices: 0x%04x, 0x%04x\n",
1683                                   data[i] & 0xffff, data[i] >> 16);
1684                     }
1685                 }
1686                 fprintf(out,
1687                         "3DPRIMITIVE: no terminator found in index buffer\n");
1688                 (*failures)++;
1689                 ret = count;
1690                 goto out;
1691             } else {
1692                 /* fixed size vertex index buffer */
1693                 for (j = 1, i = 0; i < len; i += 2, j++) {
1694                     if (i * 2 == len - 1) {
1695                         instr_out(data, hw_offset, j,
1696                                   "    indices: 0x%04x\n",
1697                                   data[j] & 0xffff);
1698                     } else {
1699                         instr_out(data, hw_offset, j,
1700                                   "    indices: 0x%04x, 0x%04x\n",
1701                                   data[j] & 0xffff, data[j] >> 16);
1702                     }
1703                 }
1704             }
1705             ret = (len + 1) / 2 + 1;
1706             goto out;
1707         } else {
1708             /* sequential vertex access */
1709             if (count < 2)
1710                 BUFFER_FAIL(count, 2, "3DPRIMITIVE seq indirect");
1711             instr_out(data, hw_offset, 0,
1712                       "3DPRIMITIVE sequential indirect %s, %d starting from "
1713                       "%d\n", primtype, len, data[1] & 0xffff);
1714             instr_out(data, hw_offset, 1, "           start\n");
1715             ret = 2;
1716             goto out;
1717         }
1718     }
1719
1720 out:
1721     saved_s2 = original_s2;
1722     saved_s4 = original_s4;
1723     return ret;
1724 }
1725
1726 static int
1727 decode_3d(uint32_t *data, int count, uint32_t hw_offset, uint32_t devid, int *failures)
1728 {
1729     uint32_t opcode;
1730     unsigned int idx;
1731
1732     struct {
1733         uint32_t opcode;
1734         int min_len;
1735         int max_len;
1736         char *name;
1737     } opcodes_3d[] = {
1738         { 0x06, 1, 1, "3DSTATE_ANTI_ALIASING" },
1739         { 0x08, 1, 1, "3DSTATE_BACKFACE_STENCIL_OPS" },
1740         { 0x09, 1, 1, "3DSTATE_BACKFACE_STENCIL_MASKS" },
1741         { 0x16, 1, 1, "3DSTATE_COORD_SET_BINDINGS" },
1742         { 0x15, 1, 1, "3DSTATE_FOG_COLOR" },
1743         { 0x0b, 1, 1, "3DSTATE_INDEPENDENT_ALPHA_BLEND" },
1744         { 0x0d, 1, 1, "3DSTATE_MODES_4" },
1745         { 0x0c, 1, 1, "3DSTATE_MODES_5" },
1746         { 0x07, 1, 1, "3DSTATE_RASTERIZATION_RULES" },
1747     }, *opcode_3d;
1748
1749     opcode = (data[0] & 0x1f000000) >> 24;
1750
1751     switch (opcode) {
1752     case 0x1f:
1753         return decode_3d_primitive(data, count, hw_offset, failures);
1754     case 0x1d:
1755         return decode_3d_1d(data, count, hw_offset, devid, failures);
1756     case 0x1c:
1757         return decode_3d_1c(data, count, hw_offset, failures);
1758     }
1759
1760     for (idx = 0; idx < ARRAY_SIZE(opcodes_3d); idx++) {
1761         opcode_3d = &opcodes_3d[idx];
1762         if (opcode == opcode_3d->opcode) {
1763             unsigned int len = 1, i;
1764
1765             instr_out(data, hw_offset, 0, "%s\n", opcode_3d->name);
1766             if (opcode_3d->max_len > 1) {
1767                 len = (data[0] & 0xff) + 2;
1768                 if (len < opcode_3d->min_len ||
1769                     len > opcode_3d->max_len)
1770                 {
1771                     fprintf(out, "Bad count in %s\n", opcode_3d->name);
1772                 }
1773             }
1774
1775             for (i = 1; i < len; i++) {
1776                 if (i >= count)
1777                     BUFFER_FAIL(count, len, opcode_3d->name);
1778                 instr_out(data, hw_offset, i, "dword %d\n", i);
1779             }
1780             return len;
1781         }
1782     }
1783
1784     instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d opcode = 0x%x\n", opcode);
1785     (*failures)++;
1786     return 1;
1787 }
1788
/*
 * Map a surface type code to a printable name.
 * Codes without a known name yield "unknown".
 */
static const char *
get_965_surfacetype(unsigned int surfacetype)
{
    /* Indexed by surface type code; NULL marks codes without a name. */
    static const char *const type_names[] = {
        "1D", "2D", "3D", "CUBE", "BUFFER", NULL, NULL, "NULL",
    };
    const unsigned int n_names = sizeof(type_names) / sizeof(type_names[0]);

    if (surfacetype >= n_names || type_names[surfacetype] == NULL)
        return "unknown";

    return type_names[surfacetype];
}
1802
/*
 * Map a depth buffer format code to a printable name.
 * Codes without a known name yield "unknown".
 */
static const char *
get_965_depthformat(unsigned int depthformat)
{
    /* Indexed by depth format code; NULL marks codes without a name. */
    static const char *const format_names[] = {
        "s8_z24float", "z32float", "z24s8", NULL, NULL, "z16",
    };
    const unsigned int n_names = sizeof(format_names) / sizeof(format_names[0]);

    if (depthformat >= n_names || format_names[depthformat] == NULL)
        return "unknown";

    return format_names[depthformat];
}
1814
/*
 * Describe how one component of a vertex element is filled in.
 *
 * The 3-bit control field for the component is read from data at bit
 * 16 + (3 - component) * 4, so component 0 sits in the highest nibble and
 * component 3 at bit 16.  Control value 1 yields the component's own letter
 * (X, Y, Z or W); unrecognised control values, or a component outside 0..3
 * with control value 1, yield "fail".
 */
static const char *
get_965_element_component(uint32_t data, int component)
{
    static const char *const axis_names[] = { "X", "Y", "Z", "W" };
    const uint32_t control = (data >> (16 + (3 - component) * 4)) & 0x7;

    if (control == 0)
        return "nostore";

    if (control == 1) {
        if (component >= 0 && component <= 3)
            return axis_names[component];
        return "fail";
    }

    if (control == 2)
        return "0.0";
    if (control == 3)
        return "1.0";
    if (control == 4)
        return "0x1";
    if (control == 5)
        return "VID";

    return "fail";
}
1843
/*
 * Return a printable name for the primitive type stored in bits 10..14 of
 * data.  Values without a known name (including 0) yield "fail".
 */
static const char *
get_965_prim_type(uint32_t data)
{
    /* Indexed by primitive type code; code 0 has no name. */
    static const char *const prim_names[] = {
        NULL,
        "point list",
        "line list",
        "line strip",
        "tri list",
        "tri strip",
        "tri fan",
        "quad list",
        "quad strip",
        "line list adj",
        "line strip adj",
        "tri list adj",
        "tri strip adj",
        "tri strip reverse",
        "polygon",
        "rect list",
        "line loop",
        "point list bf",
        "line strip cont",
        "line strip bf",
        "line strip cont bf",
        "tri fan no stipple",
    };
    const uint32_t code = (data >> 10) & 0x1f;

    if (code < sizeof(prim_names) / sizeof(prim_names[0]) &&
        prim_names[code] != NULL)
        return prim_names[code];

    return "fail";
}
1874
1875 static int
1876 i965_decode_urb_fence(uint32_t *data, uint32_t hw_offset, int len, int count,
1877                       int *failures)
1878 {
1879         uint32_t vs_fence, clip_fence, gs_fence, sf_fence, vfe_fence, cs_fence;
1880
1881         if (len != 3)
1882             fprintf(out, "Bad count in URB_FENCE\n");
1883         if (count < 3)
1884             BUFFER_FAIL(count, len, "URB_FENCE");
1885
1886         vs_fence = data[1] & 0x3ff;
1887         gs_fence = (data[1] >> 10) & 0x3ff;
1888         clip_fence = (data[1] >> 20) & 0x3ff;
1889         sf_fence = data[2] & 0x3ff;
1890         vfe_fence = (data[2] >> 10) & 0x3ff;
1891         cs_fence = (data[2] >> 20) & 0x7ff;
1892
1893         instr_out(data, hw_offset, 0, "URB_FENCE: %s%s%s%s%s%s\n",
1894                         (data[0] >> 13) & 1 ? "cs " : "",
1895                         (data[0] >> 12) & 1 ? "vfe " : "",
1896                         (data[0] >> 11) & 1 ? "sf " : "",
1897                         (data[0] >> 10) & 1 ? "clip " : "",
1898                         (data[0] >> 9)  & 1 ? "gs " : "",
1899                         (data[0] >> 8)  & 1 ? "vs " : "");
1900         instr_out(data, hw_offset, 1,
1901                   "vs fence: %d, clip_fence: %d, gs_fence: %d\n",
1902                   vs_fence, clip_fence, gs_fence);
1903         instr_out(data, hw_offset, 2,
1904                   "sf fence: %d, vfe_fence: %d, cs_fence: %d\n",
1905                   sf_fence, vfe_fence, cs_fence);
1906         if (gs_fence < vs_fence)
1907             fprintf(out, "gs fence < vs fence!\n");
1908         if (clip_fence < gs_fence)
1909             fprintf(out, "clip fence < gs fence!\n");
1910         if (sf_fence < clip_fence)
1911             fprintf(out, "sf fence < clip fence!\n");
1912         if (cs_fence < sf_fence)
1913             fprintf(out, "cs fence < sf fence!\n");
1914
1915         return len;
1916 }
1917
/*
 * Print one "state base address" dword of a command.
 *
 * Bit 0 of data[index] says whether the dword updates the base address;
 * when it is set, the remaining bits are printed as the new address,
 * otherwise the base is reported as not updated.  name labels the state
 * area in the output.
 */
static void
state_base_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
               char *name)
{
    const uint32_t dword = data[index];

    if (!(dword & 1)) {
        instr_out(data, hw_offset, index, "%s state base not updated\n",
                  name);
        return;
    }

    instr_out(data, hw_offset, index, "%s state base address 0x%08x\n",
              name, dword & ~1);
}
1930
/*
 * Print one "state upper bound" dword of a command.
 *
 * Bit 0 of data[index] says whether the dword updates the bound.  A dword
 * of exactly 1 (update bit set, all other bits zero) is reported as the
 * bound being disabled; otherwise the remaining bits are printed as the new
 * bound.  name labels the state area in the output.
 */
static void
state_max_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
              char *name)
{
    const uint32_t dword = data[index];

    if (!(dword & 1)) {
        instr_out(data, hw_offset, index, "%s state upper bound not updated\n",
                  name);
        return;
    }

    if (dword == 1) {
        instr_out(data, hw_offset, index,
                  "%s state upper bound disabled\n", name);
        return;
    }

    instr_out(data, hw_offset, index, "%s state upper bound 0x%08x\n",
              name, dword & ~1);
}
1948
1949 static int
1950 decode_3d_965(uint32_t *data, int count, uint32_t hw_offset, uint32_t devid, int *failures)
1951 {
1952     uint32_t opcode;
1953     unsigned int idx, len;
1954     int i, sba_len;
1955     char *desc1 = NULL;
1956
1957     struct {
1958         uint32_t opcode;
1959         int min_len;
1960         int max_len;
1961         char *name;
1962     } opcodes_3d[] = {
1963         { 0x6000, 3, 3, "URB_FENCE" },
1964         { 0x6001, 2, 2, "CS_URB_STATE" },
1965         { 0x6002, 2, 2, "CONSTANT_BUFFER" },
1966         { 0x6101, 6, 6, "STATE_BASE_ADDRESS" },
1967         { 0x6102, 2, 2 , "STATE_SIP" },
1968         { 0x6104, 1, 1, "3DSTATE_PIPELINE_SELECT" },
1969         { 0x680b, 1, 1, "3DSTATE_VF_STATISTICS" },
1970         { 0x6904, 1, 1, "3DSTATE_PIPELINE_SELECT" },
1971         { 0x7800, 7, 7, "3DSTATE_PIPELINED_POINTERS" },
1972         { 0x7801, 6, 6, "3DSTATE_BINDING_TABLE_POINTERS" },
1973         { 0x7808, 5, 257, "3DSTATE_VERTEX_BUFFERS" },
1974         { 0x7809, 3, 256, "3DSTATE_VERTEX_ELEMENTS" },
1975         { 0x780a, 3, 3, "3DSTATE_INDEX_BUFFER" },
1976         { 0x780b, 1, 1, "3DSTATE_VF_STATISTICS" },
1977         { 0x7900, 4, 4, "3DSTATE_DRAWING_RECTANGLE" },
1978         { 0x7901, 5, 5, "3DSTATE_CONSTANT_COLOR" },
1979         { 0x7905, 5, 7, "3DSTATE_DEPTH_BUFFER" },
1980         { 0x7906, 2, 2, "3DSTATE_POLY_STIPPLE_OFFSET" },
1981         { 0x7907, 33, 33, "3DSTATE_POLY_STIPPLE_PATTERN" },
1982         { 0x7908, 3, 3, "3DSTATE_LINE_STIPPLE" },
1983         { 0x7909, 2, 2, "3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP" },
1984         { 0x7909, 2, 2, "3DSTATE_CLEAR_PARAMS" },
1985         { 0x790a, 3, 3, "3DSTATE_AA_LINE_PARAMETERS" },
1986         { 0x790b, 4, 4, "3DSTATE_GS_SVB_INDEX" },
1987         { 0x790d, 3, 3, "3DSTATE_MULTISAMPLE" },
1988         { 0x7910, 2, 2, "3DSTATE_CLEAR_PARAMS" },
1989         { 0x7b00, 6, 6, "3DPRIMITIVE" },
1990         { 0x7802, 4, 4, "3DSTATE_SAMPLER_STATE_POINTERS" },
1991         { 0x7805, 3, 3, "3DSTATE_URB" },
1992         { 0x780d, 4, 4, "3DSTATE_VIEWPORT_STATE_POINTERS" },
1993         { 0x780e, 4, 4, "3DSTATE_CC_STATE_POINTERS" },
1994         { 0x780f, 2, 2, "3DSTATE_SCISSOR_STATE_POINTERS" },
1995         { 0x7810, 6, 6, "3DSTATE_VS_STATE" },
1996         { 0x7811, 7, 7, "3DSTATE_GS_STATE" },
1997         { 0x7812, 4, 4, "3DSTATE_CLIP_STATE" },
1998         { 0x7813, 20, 20, "3DSTATE_SF_STATE" },
1999         { 0x7814, 9, 9, "3DSTATE_WM_STATE" },
2000         { 0x7815, 5, 5, "3DSTATE_CONSTANT_VS_STATE" },
2001         { 0x7816, 5, 5, "3DSTATE_CONSTANT_GS_STATE" },
2002         { 0x7817, 5, 5, "3DSTATE_CONSTANT_PS_STATE" },
2003         { 0x7818, 2, 2, "3DSTATE_SAMPLE_MASK" },
2004    }, *opcode_3d;
2005
2006     len = (data[0] & 0x0000ffff) + 2;
2007
2008     opcode = (data[0] & 0xffff0000) >> 16;
2009     switch (opcode) {
2010     case 0x6000:
2011         len = (data[0] & 0x000000ff) + 2;
2012         return i965_decode_urb_fence(data, hw_offset, len, count, failures);
2013     case 0x6001:
2014         instr_out(data, hw_offset, 0, "CS_URB_STATE\n");
2015         instr_out(data, hw_offset, 1, "entry_size: %d [%d bytes], n_entries: %d\n",
2016                         (data[1] >> 4) & 0x1f,
2017                         (((data[1] >> 4) & 0x1f) + 1) * 64,
2018                         data[1] & 0x7);
2019         return len;
2020     case 0x6002:
2021         len = (data[0] & 0x000000ff) + 2;
2022         instr_out(data, hw_offset, 0, "CONSTANT_BUFFER: %s\n",
2023                         (data[0] >> 8) & 1 ? "valid" : "invalid");
2024         instr_out(data, hw_offset, 1, "offset: 0x%08x, length: %d bytes\n",
2025                         data[1] & ~0x3f, ((data[1] & 0x3f) + 1) * 64);
2026         return len;
2027     case 0x6101:
2028         if (IS_GEN6(devid))
2029             sba_len = 10;
2030         else if (IS_GEN5(devid))
2031             sba_len = 8;
2032         else
2033             sba_len = 6;
2034         if (len != sba_len)
2035             fprintf(out, "Bad count in STATE_BASE_ADDRESS\n");
2036         if (len != sba_len)
2037             BUFFER_FAIL(count, len, "STATE_BASE_ADDRESS");
2038
2039         i = 0;
2040         instr_out(data, hw_offset, 0,
2041                   "STATE_BASE_ADDRESS\n");
2042         i++;
2043
2044         state_base_out(data, hw_offset, i++, "general");
2045         state_base_out(data, hw_offset, i++, "surface");
2046         if (IS_GEN6(devid))
2047             state_base_out(data, hw_offset, i++, "dynamic");
2048         state_base_out(data, hw_offset, i++, "indirect");
2049         if (IS_GEN5(devid) || IS_GEN6(devid))
2050             state_base_out(data, hw_offset, i++, "instruction");
2051
2052         state_max_out(data, hw_offset, i++, "general");
2053         if (IS_GEN6(devid))
2054             state_max_out(data, hw_offset, i++, "dynamic");
2055         state_max_out(data, hw_offset, i++, "indirect");
2056         if (IS_GEN5(devid) || IS_GEN6(devid))
2057             state_max_out(data, hw_offset, i++, "instruction");
2058
2059         return len;
2060     case 0x7800:
2061         if (len != 7)
2062             fprintf(out, "Bad count in 3DSTATE_PIPELINED_POINTERS\n");
2063         if (count < 7)
2064             BUFFER_FAIL(count, len, "3DSTATE_PIPELINED_POINTERS");
2065
2066         instr_out(data, hw_offset, 0,
2067                   "3DSTATE_PIPELINED_POINTERS\n");
2068         instr_out(data, hw_offset, 1, "VS state\n");
2069         instr_out(data, hw_offset, 2, "GS state\n");
2070         instr_out(data, hw_offset, 3, "Clip state\n");
2071         instr_out(data, hw_offset, 4, "SF state\n");
2072         instr_out(data, hw_offset, 5, "WM state\n");
2073         instr_out(data, hw_offset, 6, "CC state\n");
2074         return len;
2075     case 0x7801:
2076         len = (data[0] & 0x000000ff) + 2;
2077         if (len != 6 && len != 4)
2078             fprintf(out, "Bad count in 3DSTATE_BINDING_TABLE_POINTERS\n");
2079         if (len == 6) {
2080             if (count < 6)
2081                 BUFFER_FAIL(count, len, "3DSTATE_BINDING_TABLE_POINTERS");
2082             instr_out(data, hw_offset, 0,
2083                       "3DSTATE_BINDING_TABLE_POINTERS\n");
2084             instr_out(data, hw_offset, 1, "VS binding table\n");
2085             instr_out(data, hw_offset, 2, "GS binding table\n");
2086             instr_out(data, hw_offset, 3, "Clip binding table\n");
2087             instr_out(data, hw_offset, 4, "SF binding table\n");
2088             instr_out(data, hw_offset, 5, "WM binding table\n");
2089         } else {
2090             if (count < 4)
2091                 BUFFER_FAIL(count, len, "3DSTATE_BINDING_TABLE_POINTERS");
2092
2093             instr_out(data, hw_offset, 0,
2094                       "3DSTATE_BINDING_TABLE_POINTERS: VS mod %d, "
2095                       "GS mod %d, PS mod %d\n",
2096                       (data[0] & (1 << 8)) != 0,
2097                       (data[0] & (1 << 9)) != 0,
2098                       (data[0] & (1 << 12)) != 0);
2099             instr_out(data, hw_offset, 1, "VS binding table\n");
2100             instr_out(data, hw_offset, 2, "GS binding table\n");
2101             instr_out(data, hw_offset, 3, "WM binding table\n");
2102         }
2103
2104         return len;
2105     case 0x7802:
2106         len = (data[0] & 0xff) + 2;
2107         if (len != 4)
2108             fprintf(out, "Bad count in 3DSTATE_SAMPLER_STATE_POINTERS\n");
2109         if (count < 4)
2110             BUFFER_FAIL(count, len, "3DSTATE_SAMPLER_STATE_POINTERS");
2111         instr_out(data, hw_offset, 0, "3DSTATE_SAMPLER_STATE_POINTERS: VS mod %d, "
2112                   "GS mod %d, PS mod %d\n",
2113                   (data[0] & (1 << 8)) != 0,
2114                   (data[0] & (1 << 9)) != 0,
2115                   (data[0] & (1 << 12)) != 0);
2116         instr_out(data, hw_offset, 1, "VS sampler state\n");
2117         instr_out(data, hw_offset, 2, "GS sampler state\n");
2118         instr_out(data, hw_offset, 3, "WM sampler state\n");
2119         return len;
2120     case 0x7805:
2121         len = (data[0] & 0xff) + 2;
2122         if (len != 3)
2123             fprintf(out, "Bad count in 3DSTATE_URB\n");
2124         if (count < 3)
2125             BUFFER_FAIL(count, len, "3DSTATE_URB");
2126         instr_out(data, hw_offset, 0, "3DSTATE_URB\n");
2127         instr_out(data, hw_offset, 1, "VS entries %d, alloc size %d (1024bit row)\n",
2128                         data[1] & 0xffff, ((data[1] >> 16) & 0x07f) + 1);
2129         instr_out(data, hw_offset, 2, "GS entries %d, alloc size %d (1024bit row)\n",
2130                         (data[2] >> 8) & 0x3ff, (data[2] & 7) + 1);
2131         return len;
2132
2133     case 0x7808:
2134         len = (data[0] & 0xff) + 2;
2135         if ((len - 1) % 4 != 0)
2136             fprintf(out, "Bad count in 3DSTATE_VERTEX_BUFFERS\n");
2137         if (count < len)
2138             BUFFER_FAIL(count, len, "3DSTATE_VERTEX_BUFFERS");
2139         instr_out(data, hw_offset, 0, "3DSTATE_VERTEX_BUFFERS\n");
2140
2141         for (i = 1; i < len;) {
2142             int idx, access;
2143             if (IS_GEN6(devid)) {
2144                 idx = 26;
2145                 access = 20;
2146             } else {
2147                 idx = 27;
2148                 access = 26;
2149             }
2150             instr_out(data, hw_offset, i, "buffer %d: %s, pitch %db\n",
2151                       data[i] >> idx,
2152                       data[i] & (1 << access) ? "random" : "sequential",
2153                       data[i] & 0x07ff);
2154             i++;
2155             instr_out(data, hw_offset, i++, "buffer address\n");
2156             instr_out(data, hw_offset, i++, "max index\n");
2157             instr_out(data, hw_offset, i++, "mbz\n");
2158         }
2159         return len;
2160
2161     case 0x7809:
2162         len = (data[0] & 0xff) + 2;
2163         if ((len + 1) % 2 != 0)
2164             fprintf(out, "Bad count in 3DSTATE_VERTEX_ELEMENTS\n");
2165         if (count < len)
2166             BUFFER_FAIL(count, len, "3DSTATE_VERTEX_ELEMENTS");
2167         instr_out(data, hw_offset, 0, "3DSTATE_VERTEX_ELEMENTS\n");
2168
2169         for (i = 1; i < len;) {
2170             instr_out(data, hw_offset, i, "buffer %d: %svalid, type 0x%04x, "
2171                       "src offset 0x%04x bytes\n",
2172                       data[i] >> (IS_GEN6(devid) ? 26 : 27),
2173                       data[i] & (1 << (IS_GEN6(devid) ? 25 : 26)) ? "" : "in",
2174                       (data[i] >> 16) & 0x1ff,
2175                       data[i] & 0x07ff);
2176             i++;
2177             instr_out(data, hw_offset, i, "(%s, %s, %s, %s), "
2178                       "dst offset 0x%02x bytes\n",
2179                       get_965_element_component(data[i], 0),
2180                       get_965_element_component(data[i], 1),
2181                       get_965_element_component(data[i], 2),
2182                       get_965_element_component(data[i], 3),
2183                       (data[i] & 0xff) * 4);
2184             i++;
2185         }
2186         return len;
2187
2188     case 0x780d:
2189         len = (data[0] & 0xff) + 2;
2190         if (len != 4)
2191             fprintf(out, "Bad count in 3DSTATE_VIEWPORT_STATE_POINTERS\n");
2192         if (count < len)
2193             BUFFER_FAIL(count, len, "3DSTATE_VIEWPORT_STATE_POINTERS");
2194         instr_out(data, hw_offset, 0, "3DSTATE_VIEWPORT_STATE_POINTERS\n");
2195         instr_out(data, hw_offset, 1, "clip\n");
2196         instr_out(data, hw_offset, 2, "sf\n");
2197         instr_out(data, hw_offset, 3, "cc\n");
2198         return len;
2199
2200     case 0x780a:
2201         len = (data[0] & 0xff) + 2;
2202         if (len != 3)
2203             fprintf(out, "Bad count in 3DSTATE_INDEX_BUFFER\n");
2204         if (count < len)
2205             BUFFER_FAIL(count, len, "3DSTATE_INDEX_BUFFER");
2206         instr_out(data, hw_offset, 0, "3DSTATE_INDEX_BUFFER\n");
2207         instr_out(data, hw_offset, 1, "beginning buffer address\n");
2208         instr_out(data, hw_offset, 2, "ending buffer address\n");
2209         return len;
2210
2211     case 0x780e:
2212         len = (data[0] & 0xff) + 2;
2213         if (len != 4)
2214             fprintf(out, "Bad count in 3DSTATE_CC_STATE_POINTERS\n");
2215         if (count < 4)
2216             BUFFER_FAIL(count, len, "3DSTATE_CC_STATE_POINTERS");
2217         instr_out(data, hw_offset, 0, "3DSTATE_CC_STATE_POINTERS\n");
2218         instr_out(data, hw_offset, 1, "blend change %d\n", data[1] & 1);
2219         instr_out(data, hw_offset, 2, "depth stencil change %d\n", data[2] & 1);
2220         instr_out(data, hw_offset, 3, "cc change %d\n", data[3] & 1);
2221         return len;
2222
2223     case 0x780f:
2224         len = (data[0] & 0xff) + 2;
2225         if (len != 2)
2226             fprintf(out, "Bad count in 3DSTATE_SCISSOR_POINTERS\n");
2227         if (count < 2)
2228             BUFFER_FAIL(count, len, "3DSTATE_SCISSOR_POINTERS");
2229         instr_out(data, hw_offset, 0, "3DSTATE_SCISSOR_POINTERS\n");
2230         instr_out(data, hw_offset, 1, "scissor rect offset\n");
2231         return len;
2232
2233     case 0x7810:
2234         len = (data[0] & 0xff) + 2;
2235         if (len != 6)
2236             fprintf(out, "Bad count in 3DSTATE_VS\n");
2237         if (count < 6)
2238             BUFFER_FAIL(count, len, "3DSTATE_VS");
2239         instr_out(data, hw_offset, 0, "3DSTATE_VS\n");
2240         instr_out(data, hw_offset, 1, "kernel pointer\n");
2241         instr_out(data, hw_offset, 2, "SPF=%d, VME=%d, Sampler Count %d, "
2242                   "Binding table count %d\n",
2243                   (data[2] >> 31) & 1,
2244                   (data[2] >> 30) & 1,
2245                   (data[2] >> 27) & 7,
2246                   (data[2] >> 18) & 0xff);
2247         instr_out(data, hw_offset, 3, "scratch offset\n");
2248         instr_out(data, hw_offset, 4, "Dispatch GRF start %d, VUE read length %d, "
2249                   "VUE read offset %d\n",
2250                   (data[4] >> 20) & 0x1f,
2251                   (data[4] >> 11) & 0x3f,
2252                   (data[4] >> 4) & 0x3f);
2253         instr_out(data, hw_offset, 5, "Max Threads %d, Vertex Cache %sable, "
2254                   "VS func %sable\n",
2255                   ((data[5] >> 25) & 0x7f) + 1,
2256                   (data[5] & (1 << 1)) != 0 ? "dis" : "en",
2257                   (data[5] & 1) != 0 ? "en" : "dis");
2258         return len;
2259
2260     case 0x7811:
2261         len = (data[0] & 0xff) + 2;
2262         if (len != 7)
2263             fprintf(out, "Bad count in 3DSTATE_GS\n");
2264         if (count < 7)
2265             BUFFER_FAIL(count, len, "3DSTATE_GS");
2266         instr_out(data, hw_offset, 0, "3DSTATE_GS\n");
2267         instr_out(data, hw_offset, 1, "kernel pointer\n");
2268         instr_out(data, hw_offset, 2, "SPF=%d, VME=%d, Sampler Count %d, "
2269                   "Binding table count %d\n",
2270                   (data[2] >> 31) & 1,
2271                   (data[2] >> 30) & 1,
2272                   (data[2] >> 27) & 7,
2273                   (data[2] >> 18) & 0xff);
2274         instr_out(data, hw_offset, 3, "scratch offset\n");
2275         instr_out(data, hw_offset, 4, "Dispatch GRF start %d, VUE read length %d, "
2276                   "VUE read offset %d\n",
2277                   (data[4] & 0xf),
2278                   (data[4] >> 11) & 0x3f,
2279                   (data[4] >> 4) & 0x3f);
2280         instr_out(data, hw_offset, 5, "Max Threads %d, Rendering %sable\n",
2281                   ((data[5] >> 25) & 0x7f) + 1,
2282                   (data[5] & (1 << 8)) != 0 ? "en" : "dis");
2283         instr_out(data, hw_offset, 6, "Reorder %sable, Discard Adjaceny %sable, "
2284                   "GS %sable\n",
2285                   (data[6] & (1 << 30)) != 0 ? "en" : "dis",
2286                   (data[6] & (1 << 29)) != 0 ? "en" : "dis",
2287                   (data[6] & (1 << 15)) != 0 ? "en" : "dis");
2288         return len;
2289
2290     case 0x7812:
2291         len = (data[0] & 0xff) + 2;
2292         if (len != 4)
2293             fprintf(out, "Bad count in 3DSTATE_CLIP\n");
2294         if (count < 4)
2295             BUFFER_FAIL(count, len, "3DSTATE_CLIP");
2296         instr_out(data, hw_offset, 0, "3DSTATE_CLIP\n");
2297         instr_out(data, hw_offset, 1, "UserClip distance cull test mask 0x%x\n",
2298                   data[1] & 0xff);
2299         instr_out(data, hw_offset, 2, "Clip %sable, API mode %s, Viewport XY test %sable, "
2300                   "Viewport Z test %sable, Guardband test %sable, Clip mode %d, "
2301                   "Perspective Divide %sable, Non-Perspective Barycentric %sable, "
2302                   "Tri Provoking %d, Line Provoking %d, Trifan Provoking %d\n",
2303                   (data[2] & (1 << 31)) != 0 ? "en" : "dis",
2304                   (data[2] & (1 << 30)) != 0 ? "D3D" : "OGL",
2305                   (data[2] & (1 << 28)) != 0 ? "en" : "dis",
2306                   (data[2] & (1 << 27)) != 0 ? "en" : "dis",
2307                   (data[2] & (1 << 26)) != 0 ? "en" : "dis",
2308                   (data[2] >> 13) & 7,
2309                   (data[2] & (1 << 9)) != 0 ? "dis" : "en",
2310                   (data[2] & (1 << 8)) != 0 ? "en" : "dis",
2311                   (data[2] >> 4) & 3,
2312                   (data[2] >> 2) & 3,
2313                   (data[2] & 3));
2314         instr_out(data, hw_offset, 3, "Min PointWidth %d, Max PointWidth %d, "
2315                   "Force Zero RTAIndex %sable, Max VPIndex %d\n",
2316                   (data[3] >> 17) & 0x7ff,
2317                   (data[3] >> 6) & 0x7ff,
2318                   (data[3] & (1 << 5)) != 0 ? "en" : "dis",
2319                   (data[3] & 0xf));
2320         return len;
2321
2322     case 0x7813:
2323         len = (data[0] & 0xff) + 2;
2324         if (len != 20)
2325             fprintf(out, "Bad count in 3DSTATE_SF\n");
2326         if (count < 20)
2327             BUFFER_FAIL(count, len, "3DSTATE_SF");
2328         instr_out(data, hw_offset, 0, "3DSTATE_SF\n");
2329         instr_out(data, hw_offset, 1, "Attrib Out %d, Attrib Swizzle %sable, VUE read length %d, "
2330                   "VUE read offset %d\n",
2331                   (data[1] >> 22) & 0x3f,
2332                   (data[1] & (1 << 21)) != 0 ? "en" : "dis",
2333                   (data[1] >> 11) & 0x1f,
2334                   (data[1] >> 4) & 0x3f);
2335         instr_out(data, hw_offset, 2, "Legacy Global DepthBias %sable, FrontFace fill %d, BF fill %d, "
2336                   "VP transform %sable, FrontWinding_%s\n",
2337                   (data[2] & (1 << 11)) != 0 ? "en" : "dis",
2338                   (data[2] >> 5) & 3,
2339                   (data[2] >> 3) & 3,
2340                   (data[2] & (1 << 1)) != 0 ? "en" : "dis",
2341                   (data[2] & 1) != 0 ? "CCW" : "CW");
2342         instr_out(data, hw_offset, 3, "AA %sable, CullMode %d, Scissor %sable, Multisample m ode %d\n",
2343                   (data[3] & (1 << 31)) != 0 ? "en" : "dis",
2344                   (data[3] >> 29) & 3,
2345                   (data[3] & (1 << 11)) != 0 ? "en" : "dis",
2346                   (data[3] >> 8) & 3);
2347         instr_out(data, hw_offset, 4, "Last Pixel %sable, SubPixel Precision %d, Use PixelWidth %d\n",
2348                   (data[4] & (1 << 31)) != 0 ? "en" : "dis",
2349                   (data[4] & (1 << 12)) != 0 ? 4 : 8,
2350                   (data[4] & (1 << 11)) != 0);
2351         instr_out(data, hw_offset, 5, "Global Depth Offset Constant %f\n", data[5]);
2352         instr_out(data, hw_offset, 6, "Global Depth Offset Scale %f\n", data[6]);
2353         instr_out(data, hw_offset, 7, "Global Depth Offset Clamp %f\n", data[7]);
2354         int i, j;
2355         for (i = 0, j = 0; i < 8; i++, j+=2)
2356             instr_out(data, hw_offset, i+8, "Attrib %d (Override %s%s%s%s, Const Source %d, Swizzle Select %d, "
2357                   "Source %d); Attrib %d (Override %s%s%s%s, Const Source %d, Swizzle Select %d, Source %d)\n",
2358                   j+1,
2359                   (data[8+i] & (1 << 31)) != 0 ? "W":"",
2360                   (data[8+i] & (1 << 30)) != 0 ? "Z":"",
2361                   (data[8+i] & (1 << 29)) != 0 ? "Y":"",
2362                   (data[8+i] & (1 << 28)) != 0 ? "X":"",
2363                   (data[8+i] >> 25) & 3, (data[8+i] >> 22) & 3,
2364                   (data[8+i] >> 16) & 0x1f,
2365                   j,
2366                   (data[8+i] & (1 << 15)) != 0 ? "W":"",
2367                   (data[8+i] & (1 << 14)) != 0 ? "Z":"",
2368                   (data[8+i] & (1 << 13)) != 0 ? "Y":"",
2369                   (data[8+i] & (1 << 12)) != 0 ? "X":"",
2370                   (data[8+i] >> 9) & 3, (data[8+i] >> 6) & 3,
2371                   (data[8+i] & 0x1f));
2372         instr_out(data, hw_offset, 16, "Point Sprite TexCoord Enable\n");
2373         instr_out(data, hw_offset, 17, "Const Interp Enable\n");
2374         instr_out(data, hw_offset, 18, "Attrib 7-0 WrapShortest Enable\n");
2375         instr_out(data, hw_offset, 19, "Attrib 15-8 WrapShortest Enable\n");
2376
2377         return len;
2378
2379     case 0x7814:
2380         len = (data[0] & 0xff) + 2;
2381         if (len != 9)
2382             fprintf(out, "Bad count in 3DSTATE_WM\n");
2383         if (count < 9)
2384             BUFFER_FAIL(count, len, "3DSTATE_WM");
2385         instr_out(data, hw_offset, 0, "3DSTATE_WM\n");
2386         instr_out(data, hw_offset, 1, "kernel start pointer 0\n");
2387         instr_out(data, hw_offset, 2, "SPF=%d, VME=%d, Sampler Count %d, "
2388                   "Binding table count %d\n",
2389                   (data[2] >> 31) & 1,
2390                   (data[2] >> 30) & 1,
2391                   (data[2] >> 27) & 7,
2392                   (data[2] >> 18) & 0xff);
2393         instr_out(data, hw_offset, 3, "scratch offset\n");
2394         instr_out(data, hw_offset, 4, "Depth Clear %d, Depth Resolve %d, HiZ Resolve %d, "
2395                   "Dispatch GRF start[0] %d, start[1] %d, start[2] %d\n",
2396                   (data[4] & (1 << 30)) != 0,
2397                   (data[4] & (1 << 28)) != 0,
2398                   (data[4] & (1 << 27)) != 0,
2399                   (data[4] >> 16) & 0x7f,
2400                   (data[4] >> 8) & 0x7f,
2401                   (data[4] & 0x7f));
2402         instr_out(data, hw_offset, 5, "MaxThreads %d, PS KillPixel %d, PS computed Z %d, "
2403                   "PS use sourceZ %d, Thread Dispatch %d, PS use sourceW %d, Dispatch32 %d, "
2404                   "Dispatch16 %d, Dispatch8 %d\n",
2405                   ((data[5] >> 25) & 0x7f) + 1,
2406                   (data[5] & (1 << 22)) != 0,
2407                   (data[5] & (1 << 21)) != 0,
2408                   (data[5] & (1 << 20)) != 0,
2409                   (data[5] & (1 << 19)) != 0,
2410                   (data[5] & (1 << 8)) != 0,
2411                   (data[5] & (1 << 2)) != 0,
2412                   (data[5] & (1 << 1)) != 0,
2413                   (data[5] & (1 << 0)) != 0);
2414         instr_out(data, hw_offset, 6, "Num SF output %d, Pos XY offset %d, ZW interp mode %d , "
2415                   "Barycentric interp mode 0x%x, Point raster rule %d, Multisample mode %d, "
2416                   "Multisample Dispatch mode %d\n",
2417                   (data[6] >> 20) & 0x3f,
2418                   (data[6] >> 18) & 3,
2419                   (data[6] >> 16) & 3,
2420                   (data[6] >> 10) & 0x3f,
2421                   (data[6] & (1 << 9)) != 0,
2422                   (data[6] >> 1) & 3,
2423                   (data[6] & 1));
2424         instr_out(data, hw_offset, 7, "kernel start pointer 1\n");
2425         instr_out(data, hw_offset, 8, "kernel start pointer 2\n");
2426
2427         return len;
2428
2429     case 0x7900:
2430         if (len != 4)
2431             fprintf(out, "Bad count in 3DSTATE_DRAWING_RECTANGLE\n");
2432         if (count < 4)
2433             BUFFER_FAIL(count, len, "3DSTATE_DRAWING_RECTANGLE");
2434
2435         instr_out(data, hw_offset, 0,
2436                   "3DSTATE_DRAWING_RECTANGLE\n");
2437         instr_out(data, hw_offset, 1, "top left: %d,%d\n",
2438                   data[1] & 0xffff,
2439                   (data[1] >> 16) & 0xffff);
2440         instr_out(data, hw_offset, 2, "bottom right: %d,%d\n",
2441                   data[2] & 0xffff,
2442                   (data[2] >> 16) & 0xffff);
2443         instr_out(data, hw_offset, 3, "origin: %d,%d\n",
2444                   (int)data[3] & 0xffff,
2445                   ((int)data[3] >> 16) & 0xffff);
2446
2447         return len;
2448
2449     case 0x7905:
2450         if (len < 5 || len > 7)
2451             fprintf(out, "Bad count in 3DSTATE_DEPTH_BUFFER\n");
2452         if (count < len)
2453             BUFFER_FAIL(count, len, "3DSTATE_DEPTH_BUFFER");
2454
2455         instr_out(data, hw_offset, 0,
2456                   "3DSTATE_DEPTH_BUFFER\n");
2457         if (IS_GEN5(devid) || IS_GEN6(devid))
2458             instr_out(data, hw_offset, 1, "%s, %s, pitch = %d bytes, %stiled, HiZ %d, Seperate Stencil %d\n",
2459                     get_965_surfacetype(data[1] >> 29),
2460                     get_965_depthformat((data[1] >> 18) & 0x7),
2461                     (data[1] & 0x0001ffff) + 1,
2462                     data[1] & (1 << 27) ? "" : "not ",
2463                     (data[1] & (1 << 22)) != 0,
2464                     (data[1] & (1 << 21)) != 0);
2465         else
2466             instr_out(data, hw_offset, 1, "%s, %s, pitch = %d bytes, %stiled\n",
2467                     get_965_surfacetype(data[1] >> 29),
2468                     get_965_depthformat((data[1] >> 18) & 0x7),
2469                     (data[1] & 0x0001ffff) + 1,
2470                     data[1] & (1 << 27) ? "" : "not ");
2471         instr_out(data, hw_offset, 2, "depth offset\n");
2472         instr_out(data, hw_offset, 3, "%dx%d\n",
2473                   ((data[3] & 0x0007ffc0) >> 6) + 1,
2474                   ((data[3] & 0xfff80000) >> 19) + 1);
2475         instr_out(data, hw_offset, 4, "volume depth\n");
2476         if (len >= 6)
2477             instr_out(data, hw_offset, 5, "\n");
2478         if (len >= 7) {
2479             if (IS_GEN6(devid))
2480                 instr_out(data, hw_offset, 6, "\n");
2481             else
2482                 instr_out(data, hw_offset, 6, "render target view extent\n");
2483         }
2484
2485
2486         return len;
2487
2488     case 0x7a00:
2489         if (IS_GEN6(devid)) {
2490                 int i;
2491                 len = (data[0] & 0xff) + 2;
2492                 if (len != 4 && len != 5)
2493                         fprintf(out, "Bad count in PIPE_CONTROL\n");
2494                 if (count < len)
2495                         BUFFER_FAIL(count, len, "PIPE_CONTROL");
2496
2497                 switch ((data[1] >> 14) & 0x3) {
2498                 case 0: desc1 = "no write"; break;
2499                 case 1: desc1 = "qword write"; break;
2500                 case 2: desc1 = "PS_DEPTH_COUNT write"; break;
2501                 case 3: desc1 = "TIMESTAMP write"; break;
2502                 }
2503                 instr_out(data, hw_offset, 0, "PIPE_CONTROL\n");
2504                 instr_out(data, hw_offset, 1,
2505                           "%s, %scs stall, %stlb invalidate, "
2506                           "%ssync gfdt, %sdepth stall, %sRC write flush, "
2507                           "%sinst flush, %sTC flush\n",
2508                           desc1,
2509                           data[1] & (1 << 20) ? "" : "no ",
2510                           data[1] & (1 << 18) ? "" : "no ",
2511                           data[1] & (1 << 17) ? "" : "no ",
2512                           data[1] & (1 << 13) ? "" : "no ",
2513                           data[1] & (1 << 12) ? "" : "no ",
2514                           data[1] & (1 << 11) ? "" : "no ",
2515                           data[1] & (1 << 10) ? "" : "no ");
2516                 if (len == 5) {
2517                     instr_out(data, hw_offset, 2, "destination address\n");
2518                     instr_out(data, hw_offset, 3, "immediate dword low\n");
2519                     instr_out(data, hw_offset, 4, "immediate dword high\n");
2520                 } else {
2521                     for (i = 2; i < len; i++) {
2522                         instr_out(data, hw_offset, i, "\n");
2523                     }
2524                 }
2525                 return len;
2526         } else {
2527                 len = (data[0] & 0xff) + 2;
2528                 if (len != 4)
2529                         fprintf(out, "Bad count in PIPE_CONTROL\n");
2530                 if (count < len)
2531                         BUFFER_FAIL(count, len, "PIPE_CONTROL");
2532
2533                 switch ((data[0] >> 14) & 0x3) {
2534                 case 0: desc1 = "no write"; break;
2535                 case 1: desc1 = "qword write"; break;
2536                 case 2: desc1 = "PS_DEPTH_COUNT write"; break;
2537                 case 3: desc1 = "TIMESTAMP write"; break;
2538                 }
2539                 instr_out(data, hw_offset, 0,
2540                           "PIPE_CONTROL: %s, %sdepth stall, %sRC write flush, "
2541                           "%sinst flush\n",
2542                           desc1,
2543                           data[0] & (1 << 13) ? "" : "no ",
2544                           data[0] & (1 << 12) ? "" : "no ",
2545                           data[0] & (1 << 11) ? "" : "no ");
2546                 instr_out(data, hw_offset, 1, "destination address\n");
2547                 instr_out(data, hw_offset, 2, "immediate dword low\n");
2548                 instr_out(data, hw_offset, 3, "immediate dword high\n");
2549                 return len;
2550         }
2551     case 0x7b00:
2552         len = (data[0] & 0xff) + 2;
2553         if (len != 6)
2554             fprintf(out, "Bad count in 3DPRIMITIVE\n");
2555         if (count < len)
2556             BUFFER_FAIL(count, len, "3DPRIMITIVE");
2557
2558         instr_out(data, hw_offset, 0,
2559                   "3DPRIMITIVE: %s %s\n",
2560                   get_965_prim_type(data[0]),
2561                   (data[0] & (1 << 15)) ? "random" : "sequential");
2562         instr_out(data, hw_offset, 1, "vertex count\n");
2563         instr_out(data, hw_offset, 2, "start vertex\n");
2564         instr_out(data, hw_offset, 3, "instance count\n");
2565         instr_out(data, hw_offset, 4, "start instance\n");
2566         instr_out(data, hw_offset, 5, "index bias\n");
2567         return len;
2568     }
2569
2570     for (idx = 0; idx < ARRAY_SIZE(opcodes_3d); idx++) {
2571         opcode_3d = &opcodes_3d[idx];
2572         if ((data[0] & 0xffff0000) >> 16 == opcode_3d->opcode) {
2573             unsigned int i;
2574             len = 1;
2575
2576             instr_out(data, hw_offset, 0, "%s\n", opcode_3d->name);
2577             if (opcode_3d->max_len > 1) {
2578                 len = (data[0] & 0xff) + 2;
2579                 if (len < opcode_3d->min_len ||
2580                     len > opcode_3d->max_len)
2581                 {
2582                     fprintf(out, "Bad count in %s\n", opcode_3d->name);
2583                 }
2584             }
2585
2586             for (i = 1; i < len; i++) {
2587                 if (i >= count)
2588                     BUFFER_FAIL(count, len, opcode_3d->name);
2589                 instr_out(data, hw_offset, i, "dword %d\n", i);
2590             }
2591             return len;
2592         }
2593     }
2594
2595     instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_965 opcode = 0x%x\n", opcode);
2596     (*failures)++;
2597     return 1;
2598 }
2599
2600 static int
2601 decode_3d_i830(uint32_t *data, int count, uint32_t hw_offset, uint32_t devid, int *failures)
2602 {
2603     unsigned int idx;
2604     uint32_t opcode;
2605
2606     struct {
2607         uint32_t opcode;
2608         int min_len;
2609         int max_len;
2610         char *name;
2611     } opcodes_3d[] = {
2612         { 0x02, 1, 1, "3DSTATE_MODES_3" },
2613         { 0x03, 1, 1, "3DSTATE_ENABLES_1"},
2614         { 0x04, 1, 1, "3DSTATE_ENABLES_2"},
2615         { 0x05, 1, 1, "3DSTATE_VFT0"},
2616         { 0x06, 1, 1, "3DSTATE_AA"},
2617         { 0x07, 1, 1, "3DSTATE_RASTERIZATION_RULES" },
2618         { 0x08, 1, 1, "3DSTATE_MODES_1" },
2619         { 0x09, 1, 1, "3DSTATE_STENCIL_TEST" },
2620         { 0x0a, 1, 1, "3DSTATE_VFT1"},
2621         { 0x0b, 1, 1, "3DSTATE_INDPT_ALPHA_BLEND" },
2622         { 0x0c, 1, 1, "3DSTATE_MODES_5" },
2623         { 0x0d, 1, 1, "3DSTATE_MAP_BLEND_OP" },
2624         { 0x0e, 1, 1, "3DSTATE_MAP_BLEND_ARG" },
2625         { 0x0f, 1, 1, "3DSTATE_MODES_2" },
2626         { 0x15, 1, 1, "3DSTATE_FOG_COLOR" },
2627         { 0x16, 1, 1, "3DSTATE_MODES_4" },
2628     }, *opcode_3d;
2629
2630     opcode = (data[0] & 0x1f000000) >> 24;
2631
2632     switch (opcode) {
2633     case 0x1f:
2634         return decode_3d_primitive(data, count, hw_offset, failures);
2635     case 0x1d:
2636         return decode_3d_1d(data, count, hw_offset, devid, failures);
2637     case 0x1c:
2638         return decode_3d_1c(data, count, hw_offset, failures);
2639     }
2640
2641     for (idx = 0; idx < ARRAY_SIZE(opcodes_3d); idx++) {
2642         opcode_3d = &opcodes_3d[idx];
2643         if ((data[0] & 0x1f000000) >> 24 == opcode_3d->opcode) {
2644             unsigned int len = 1, i;
2645
2646             instr_out(data, hw_offset, 0, "%s\n", opcode_3d->name);
2647             if (opcode_3d->max_len > 1) {
2648                 len = (data[0] & 0xff) + 2;
2649                 if (len < opcode_3d->min_len ||
2650                     len > opcode_3d->max_len)
2651                 {
2652                     fprintf(out, "Bad count in %s\n", opcode_3d->name);
2653                 }
2654             }
2655
2656             for (i = 1; i < len; i++) {
2657                 if (i >= count)
2658                     BUFFER_FAIL(count, len, opcode_3d->name);
2659                 instr_out(data, hw_offset, i, "dword %d\n", i);
2660             }
2661             return len;
2662         }
2663     }
2664
2665     instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_i830 opcode = 0x%x\n", opcode);
2666     (*failures)++;
2667     return 1;
2668 }
2669
2670 /**
2671  * Decodes an i830-i915 batch buffer, writing the output to stdout.
2672  *
2673  * \param data batch buffer contents
2674  * \param count number of DWORDs to decode in the batch buffer
2675  * \param hw_offset hardware address for the buffer
2676  */
2677 int
2678 intel_decode(uint32_t *data, int count,
2679              uint32_t hw_offset,
2680              uint32_t devid,
2681              uint32_t ignore_end_of_batchbuffer)
2682 {
2683     int ret;
2684     int index = 0;
2685     int failures = 0;
2686
2687     out = stdout;
2688
2689     while (index < count) {
2690         switch ((data[index] & 0xe0000000) >> 29) {
2691         case 0x0:
2692             ret = decode_mi(data + index, count - index,
2693                                hw_offset + index * 4, &failures);
2694
2695             /* If MI_BATCHBUFFER_END happened, then dump the rest of the
2696              * output in case we some day want it in debugging, but don't
2697              * decode it since it'll just confuse in the common case.
2698              */
2699             if (ret == -1) {
2700                 if (ignore_end_of_batchbuffer) {
2701                     index++;
2702                 } else {
2703                     for (index = index + 1; index < count; index++) {
2704                         instr_out(data, hw_offset, index, "\n");
2705                     }
2706                 }
2707             } else
2708                 index += ret;
2709             break;
2710         case 0x2:
2711             index += decode_2d(data + index, count - index,
2712                                hw_offset + index * 4, &failures);
2713             break;
2714         case 0x3:
2715             if (IS_965(devid)) {
2716                 index += decode_3d_965(data + index, count - index,
2717                                        hw_offset + index * 4,
2718                                        devid, &failures);
2719             } else if (IS_GEN3(devid)) {
2720                 index += decode_3d(data + index, count - index,
2721                                    hw_offset + index * 4,
2722                                    devid, &failures);
2723             } else {
2724                 index += decode_3d_i830(data + index, count - index,
2725                                         hw_offset + index * 4,
2726                                         devid, &failures);
2727             }
2728             break;
2729         default:
2730             instr_out(data, hw_offset, index, "UNKNOWN\n");
2731             failures++;
2732             index++;
2733             break;
2734         }
2735         fflush(out);
2736     }
2737
2738     return failures;
2739 }
2740
2741 void intel_decode_context_reset(void)
2742 {
2743     saved_s2_set = 0;
2744     saved_s4_set = 1;
2745 }
2746
2747 void intel_decode_context_set_head_tail(uint32_t head, uint32_t tail)
2748 {
2749         head_offset = head;
2750         tail_offset = tail;
2751 }