OSDN Git Service

intel: Plumb the context through the decode callchain.
[android-x86/external-libdrm.git] / intel / intel_decode.c
1 /*
2  * Copyright © 2009-2011 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23
24 #include <stdint.h>
25 #include <stdlib.h>
26 #include <stdio.h>
27 #include <stdbool.h>
28 #include <stdarg.h>
29 #include <string.h>
30
31 #include "intel_chipset.h"
32 #include "intel_bufmgr.h"
33
34 /* Struct for tracking drm_intel_decode state. */
35 struct drm_intel_decode {
36         /** stdio file where the output should land.  Defaults to stdout. */
37         FILE *out;
38
39         /** PCI device ID. */
40         uint32_t devid;
41
42         /** GPU address of the start of the current packet. */
43         uint32_t hw_offset;
44         /** CPU virtual address of the start of the current packet. */
45         uint32_t *data;
46         /** DWORDs of remaining batchbuffer data starting from the packet. */
47         uint32_t count;
48
49         /** GPU address of the start of the batchbuffer data. */
50         uint32_t base_hw_offset;
51         /** CPU Virtual address of the start of the batchbuffer data. */
52         uint32_t *base_data;
53         /** Number of DWORDs of batchbuffer data. */
54         uint32_t base_count;
55
56         /** @{
57          * GPU head and tail pointers, which will be noted in the dump, or ~0.
58          */
59         uint32_t head, tail;
60         /** @} */
61
62         /**
63          * Whether to dump the dwords after MI_BATCHBUFFER_END.
64          *
65          * This sometimes provides clues in corrupted batchbuffers,
66          * and is used by the intel-gpu-tools.
67          */
68         bool dump_past_end;
69 };
70
71 static FILE *out;
72 static uint32_t saved_s2 = 0, saved_s4 = 0;
73 static char saved_s2_set = 0, saved_s4_set = 0;
74 static uint32_t head_offset = 0xffffffff;       /* undefined */
75 static uint32_t tail_offset = 0xffffffff;       /* undefined */
76
77 #ifndef ARRAY_SIZE
78 #define ARRAY_SIZE(A) (sizeof(A)/sizeof(A[0]))
79 #endif
80
81 #define BUFFER_FAIL(_count, _len, _name) do {                   \
82     fprintf(out, "Buffer size too small in %s (%d < %d)\n",     \
83             (_name), (_count), (_len));                         \
84     return count;                                               \
85 } while (0)
86
87 static float int_as_float(uint32_t intval)
88 {
89         union intfloat {
90                 uint32_t i;
91                 float f;
92         } uval;
93
94         uval.i = intval;
95         return uval.f;
96 }
97
98 static void
99 instr_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
100           const char *fmt, ...) __attribute__((format(__printf__, 4, 5)));
101
102 static void
103 instr_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
104           const char *fmt, ...)
105 {
106         va_list va;
107         const char *parseinfo;
108         uint32_t offset = hw_offset + index * 4;
109
110         if (offset == head_offset)
111                 parseinfo = "HEAD";
112         else if (offset == tail_offset)
113                 parseinfo = "TAIL";
114         else
115                 parseinfo = "    ";
116
117         fprintf(out, "0x%08x: %s 0x%08x: %s", offset, parseinfo,
118                 data[index], index == 0 ? "" : "   ");
119         va_start(va, fmt);
120         vfprintf(out, fmt, va);
121         va_end(va);
122 }
123
124 static int
125 decode_mi(struct drm_intel_decode *ctx)
126 {
127         unsigned int opcode, len = -1;
128         const char *post_sync_op = "";
129         uint32_t *data = ctx->data;
130         uint32_t hw_offset = ctx->hw_offset;
131         uint32_t count = ctx->count;
132
133         struct {
134                 uint32_t opcode;
135                 int len_mask;
136                 unsigned int min_len;
137                 unsigned int max_len;
138                 const char *name;
139         } opcodes_mi[] = {
140                 { 0x08, 0, 1, 1, "MI_ARB_ON_OFF" },
141                 { 0x0a, 0, 1, 1, "MI_BATCH_BUFFER_END" },
142                 { 0x30, 0x3f, 3, 3, "MI_BATCH_BUFFER" },
143                 { 0x31, 0x3f, 2, 2, "MI_BATCH_BUFFER_START" },
144                 { 0x14, 0x3f, 3, 3, "MI_DISPLAY_BUFFER_INFO" },
145                 { 0x04, 0, 1, 1, "MI_FLUSH" },
146                 { 0x22, 0x1f, 3, 3, "MI_LOAD_REGISTER_IMM" },
147                 { 0x13, 0x3f, 2, 2, "MI_LOAD_SCAN_LINES_EXCL" },
148                 { 0x12, 0x3f, 2, 2, "MI_LOAD_SCAN_LINES_INCL" },
149                 { 0x00, 0, 1, 1, "MI_NOOP" },
150                 { 0x11, 0x3f, 2, 2, "MI_OVERLAY_FLIP" },
151                 { 0x07, 0, 1, 1, "MI_REPORT_HEAD" },
152                 { 0x18, 0x3f, 2, 2, "MI_SET_CONTEXT" },
153                 { 0x20, 0x3f, 3, 4, "MI_STORE_DATA_IMM" },
154                 { 0x21, 0x3f, 3, 4, "MI_STORE_DATA_INDEX" },
155                 { 0x24, 0x3f, 3, 3, "MI_STORE_REGISTER_MEM" },
156                 { 0x02, 0, 1, 1, "MI_USER_INTERRUPT" },
157                 { 0x03, 0, 1, 1, "MI_WAIT_FOR_EVENT" },
158                 { 0x16, 0x7f, 3, 3, "MI_SEMAPHORE_MBOX" },
159                 { 0x26, 0x1f, 3, 4, "MI_FLUSH_DW" },
160                 { 0x0b, 0, 1, 1, "MI_SUSPEND_FLUSH"},
161         };
162
163         /* check instruction length */
164         for (opcode = 0; opcode < sizeof(opcodes_mi) / sizeof(opcodes_mi[0]);
165              opcode++) {
166                 if ((data[0] & 0x1f800000) >> 23 == opcodes_mi[opcode].opcode) {
167                         len = 1;
168                         if (opcodes_mi[opcode].max_len > 1) {
169                                 len =
170                                     (data[0] & opcodes_mi[opcode].len_mask) + 2;
171                                 if (len < opcodes_mi[opcode].min_len
172                                     || len > opcodes_mi[opcode].max_len) {
173                                         fprintf(out,
174                                                 "Bad length (%d) in %s, [%d, %d]\n",
175                                                 len, opcodes_mi[opcode].name,
176                                                 opcodes_mi[opcode].min_len,
177                                                 opcodes_mi[opcode].max_len);
178                                 }
179                         }
180                         break;
181                 }
182         }
183
184         switch ((data[0] & 0x1f800000) >> 23) {
185         case 0x0a:
186                 instr_out(data, hw_offset, 0, "MI_BATCH_BUFFER_END\n");
187                 return -1;
188         case 0x16:
189                 instr_out(data, hw_offset, 0, "MI_SEMAPHORE_MBOX%s%s%s%s %u\n",
190                           data[0] & (1 << 22) ? " global gtt," : "",
191                           data[0] & (1 << 21) ? " update semaphore," : "",
192                           data[0] & (1 << 20) ? " compare semaphore," : "",
193                           data[0] & (1 << 18) ? " use compare reg" : "",
194                           (data[0] & (0x3 << 16)) >> 16);
195                 instr_out(data, hw_offset, 1, "value\n");
196                 instr_out(data, hw_offset, 2, "address\n");
197                 return len;
198         case 0x21:
199                 instr_out(data, hw_offset, 0, "MI_STORE_DATA_INDEX%s\n",
200                           data[0] & (1 << 21) ? " use per-process HWS," : "");
201                 instr_out(data, hw_offset, 1, "index\n");
202                 instr_out(data, hw_offset, 2, "dword\n");
203                 if (len == 4)
204                         instr_out(data, hw_offset, 3, "upper dword\n");
205                 return len;
206         case 0x00:
207                 if (data[0] & (1 << 22))
208                         instr_out(data, hw_offset, 0,
209                                   "MI_NOOP write NOPID reg, val=0x%x\n",
210                                   data[0] & ((1 << 22) - 1));
211                 else
212                         instr_out(data, hw_offset, 0, "MI_NOOP\n");
213                 return len;
214         case 0x26:
215                 switch (data[0] & (0x3 << 14)) {
216                 case (0 << 14):
217                         post_sync_op = "no write";
218                         break;
219                 case (1 << 14):
220                         post_sync_op = "write data";
221                         break;
222                 case (2 << 14):
223                         post_sync_op = "reserved";
224                         break;
225                 case (3 << 14):
226                         post_sync_op = "write TIMESTAMP";
227                         break;
228                 }
229                 instr_out(data, hw_offset, 0,
230                           "MI_FLUSH_DW%s%s%s%s post_sync_op='%s' %s%s\n",
231                           data[0] & (1 << 22) ?
232                           " enable protected mem (BCS-only)," : "",
233                           data[0] & (1 << 21) ? " store in hws," : "",
234                           data[0] & (1 << 18) ? " invalidate tlb," : "",
235                           data[0] & (1 << 17) ? " flush gfdt," : "",
236                           post_sync_op,
237                           data[0] & (1 << 8) ? " enable notify interrupt," : "",
238                           data[0] & (1 << 7) ?
239                           " invalidate video state (BCS-only)," : "");
240                 if (data[0] & (1 << 21))
241                         instr_out(data, hw_offset, 1, "hws index\n");
242                 else
243                         instr_out(data, hw_offset, 1, "address\n");
244                 instr_out(data, hw_offset, 2, "dword\n");
245                 if (len == 4)
246                         instr_out(data, hw_offset, 3, "upper dword\n");
247                 return len;
248         }
249
250         for (opcode = 0; opcode < sizeof(opcodes_mi) / sizeof(opcodes_mi[0]);
251              opcode++) {
252                 if ((data[0] & 0x1f800000) >> 23 == opcodes_mi[opcode].opcode) {
253                         unsigned int i;
254
255                         instr_out(data, hw_offset, 0, "%s\n",
256                                   opcodes_mi[opcode].name);
257                         for (i = 1; i < len; i++) {
258                                 if (i >= count)
259                                         BUFFER_FAIL(count, len,
260                                                     opcodes_mi[opcode].name);
261                                 instr_out(data, hw_offset, i, "dword %d\n", i);
262                         }
263
264                         return len;
265                 }
266         }
267
268         instr_out(data, hw_offset, 0, "MI UNKNOWN\n");
269         return 1;
270 }
271
272 static void
273 decode_2d_br00(uint32_t *data, uint32_t count, uint32_t hw_offset,
274                const char *cmd)
275 {
276         instr_out(data, hw_offset, 0,
277                   "%s (rgb %sabled, alpha %sabled, src tile %d, dst tile %d)\n",
278                   cmd,
279                   (data[count] & (1 << 20)) ? "en" : "dis",
280                   (data[count] & (1 << 21)) ? "en" : "dis",
281                   (data[count] >> 15) & 1, (data[count] >> 11) & 1);
282 }
283
284 static void decode_2d_br01(uint32_t *data, uint32_t count, uint32_t hw_offset)
285 {
286         const char *format;
287         switch ((data[count] >> 24) & 0x3) {
288         case 0:
289                 format = "8";
290                 break;
291         case 1:
292                 format = "565";
293                 break;
294         case 2:
295                 format = "1555";
296                 break;
297         case 3:
298                 format = "8888";
299                 break;
300         }
301
302         instr_out(data, hw_offset, count, "format %s, pitch %d, rop 0x%02x, "
303                   "clipping %sabled, %s%s \n",
304                   format,
305                   (short)(data[count] & 0xffff),
306                   (data[count] >> 16) & 0xff,
307                   data[count] & (1 << 30) ? "en" : "dis",
308                   data[count] & (1 << 31) ? "solid pattern enabled, " : "",
309                   data[count] & (1 << 31) ?
310                   "mono pattern transparency enabled, " : "");
311
312 }
313
314 static int
315 decode_2d(struct drm_intel_decode *ctx)
316 {
317         unsigned int opcode, len;
318         uint32_t *data = ctx->data;
319         uint32_t hw_offset = ctx->hw_offset;
320         uint32_t count = ctx->count;
321
322         struct {
323                 uint32_t opcode;
324                 unsigned int min_len;
325                 unsigned int max_len;
326                 const char *name;
327         } opcodes_2d[] = {
328                 { 0x40, 5, 5, "COLOR_BLT" },
329                 { 0x43, 6, 6, "SRC_COPY_BLT" },
330                 { 0x01, 8, 8, "XY_SETUP_BLT" },
331                 { 0x11, 9, 9, "XY_SETUP_MONO_PATTERN_SL_BLT" },
332                 { 0x03, 3, 3, "XY_SETUP_CLIP_BLT" },
333                 { 0x24, 2, 2, "XY_PIXEL_BLT" },
334                 { 0x25, 3, 3, "XY_SCANLINES_BLT" },
335                 { 0x26, 4, 4, "Y_TEXT_BLT" },
336                 { 0x31, 5, 134, "XY_TEXT_IMMEDIATE_BLT" },
337                 { 0x50, 6, 6, "XY_COLOR_BLT" },
338                 { 0x51, 6, 6, "XY_PAT_BLT" },
339                 { 0x76, 8, 8, "XY_PAT_CHROMA_BLT" },
340                 { 0x72, 7, 135, "XY_PAT_BLT_IMMEDIATE" },
341                 { 0x77, 9, 137, "XY_PAT_CHROMA_BLT_IMMEDIATE" },
342                 { 0x52, 9, 9, "XY_MONO_PAT_BLT" },
343                 { 0x59, 7, 7, "XY_MONO_PAT_FIXED_BLT" },
344                 { 0x53, 8, 8, "XY_SRC_COPY_BLT" },
345                 { 0x54, 8, 8, "XY_MONO_SRC_COPY_BLT" },
346                 { 0x71, 9, 137, "XY_MONO_SRC_COPY_IMMEDIATE_BLT" },
347                 { 0x55, 9, 9, "XY_FULL_BLT" },
348                 { 0x55, 9, 137, "XY_FULL_IMMEDIATE_PATTERN_BLT" },
349                 { 0x56, 9, 9, "XY_FULL_MONO_SRC_BLT" },
350                 { 0x75, 10, 138, "XY_FULL_MONO_SRC_IMMEDIATE_PATTERN_BLT" },
351                 { 0x57, 12, 12, "XY_FULL_MONO_PATTERN_BLT" },
352                 { 0x58, 12, 12, "XY_FULL_MONO_PATTERN_MONO_SRC_BLT"},
353         };
354
355         switch ((data[0] & 0x1fc00000) >> 22) {
356         case 0x25:
357                 instr_out(data, hw_offset, 0,
358                           "XY_SCANLINES_BLT (pattern seed (%d, %d), dst tile %d)\n",
359                           (data[0] >> 12) & 0x8,
360                           (data[0] >> 8) & 0x8, (data[0] >> 11) & 1);
361
362                 len = (data[0] & 0x000000ff) + 2;
363                 if (len != 3)
364                         fprintf(out, "Bad count in XY_SCANLINES_BLT\n");
365                 if (count < 3)
366                         BUFFER_FAIL(count, len, "XY_SCANLINES_BLT");
367
368                 instr_out(data, hw_offset, 1, "dest (%d,%d)\n",
369                           data[1] & 0xffff, data[1] >> 16);
370                 instr_out(data, hw_offset, 2, "dest (%d,%d)\n",
371                           data[2] & 0xffff, data[2] >> 16);
372                 return len;
373         case 0x01:
374                 decode_2d_br00(data, 0, hw_offset, "XY_SETUP_BLT");
375
376                 len = (data[0] & 0x000000ff) + 2;
377                 if (len != 8)
378                         fprintf(out, "Bad count in XY_SETUP_BLT\n");
379                 if (count < 8)
380                         BUFFER_FAIL(count, len, "XY_SETUP_BLT");
381
382                 decode_2d_br01(data, 1, hw_offset);
383                 instr_out(data, hw_offset, 2, "cliprect (%d,%d)\n",
384                           data[2] & 0xffff, data[2] >> 16);
385                 instr_out(data, hw_offset, 3, "cliprect (%d,%d)\n",
386                           data[3] & 0xffff, data[3] >> 16);
387                 instr_out(data, hw_offset, 4, "setup dst offset 0x%08x\n",
388                           data[4]);
389                 instr_out(data, hw_offset, 5, "setup background color\n");
390                 instr_out(data, hw_offset, 6, "setup foreground color\n");
391                 instr_out(data, hw_offset, 7, "color pattern offset\n");
392                 return len;
393         case 0x03:
394                 decode_2d_br00(data, 0, hw_offset, "XY_SETUP_CLIP_BLT");
395
396                 len = (data[0] & 0x000000ff) + 2;
397                 if (len != 3)
398                         fprintf(out, "Bad count in XY_SETUP_CLIP_BLT\n");
399                 if (count < 3)
400                         BUFFER_FAIL(count, len, "XY_SETUP_CLIP_BLT");
401
402                 instr_out(data, hw_offset, 1, "cliprect (%d,%d)\n",
403                           data[1] & 0xffff, data[2] >> 16);
404                 instr_out(data, hw_offset, 2, "cliprect (%d,%d)\n",
405                           data[2] & 0xffff, data[3] >> 16);
406                 return len;
407         case 0x11:
408                 decode_2d_br00(data, 0, hw_offset,
409                                "XY_SETUP_MONO_PATTERN_SL_BLT");
410
411                 len = (data[0] & 0x000000ff) + 2;
412                 if (len != 9)
413                         fprintf(out,
414                                 "Bad count in XY_SETUP_MONO_PATTERN_SL_BLT\n");
415                 if (count < 9)
416                         BUFFER_FAIL(count, len, "XY_SETUP_MONO_PATTERN_SL_BLT");
417
418                 decode_2d_br01(data, 1, hw_offset);
419                 instr_out(data, hw_offset, 2, "cliprect (%d,%d)\n",
420                           data[2] & 0xffff, data[2] >> 16);
421                 instr_out(data, hw_offset, 3, "cliprect (%d,%d)\n",
422                           data[3] & 0xffff, data[3] >> 16);
423                 instr_out(data, hw_offset, 4, "setup dst offset 0x%08x\n",
424                           data[4]);
425                 instr_out(data, hw_offset, 5, "setup background color\n");
426                 instr_out(data, hw_offset, 6, "setup foreground color\n");
427                 instr_out(data, hw_offset, 7, "mono pattern dw0\n");
428                 instr_out(data, hw_offset, 8, "mono pattern dw1\n");
429                 return len;
430         case 0x50:
431                 decode_2d_br00(data, 0, hw_offset, "XY_COLOR_BLT");
432
433                 len = (data[0] & 0x000000ff) + 2;
434                 if (len != 6)
435                         fprintf(out, "Bad count in XY_COLOR_BLT\n");
436                 if (count < 6)
437                         BUFFER_FAIL(count, len, "XY_COLOR_BLT");
438
439                 decode_2d_br01(data, 1, hw_offset);
440                 instr_out(data, hw_offset, 2, "(%d,%d)\n",
441                           data[2] & 0xffff, data[2] >> 16);
442                 instr_out(data, hw_offset, 3, "(%d,%d)\n",
443                           data[3] & 0xffff, data[3] >> 16);
444                 instr_out(data, hw_offset, 4, "offset 0x%08x\n", data[4]);
445                 instr_out(data, hw_offset, 5, "color\n");
446                 return len;
447         case 0x53:
448                 decode_2d_br00(data, 0, hw_offset, "XY_SRC_COPY_BLT");
449
450                 len = (data[0] & 0x000000ff) + 2;
451                 if (len != 8)
452                         fprintf(out, "Bad count in XY_SRC_COPY_BLT\n");
453                 if (count < 8)
454                         BUFFER_FAIL(count, len, "XY_SRC_COPY_BLT");
455
456                 decode_2d_br01(data, 1, hw_offset);
457                 instr_out(data, hw_offset, 2, "dst (%d,%d)\n",
458                           data[2] & 0xffff, data[2] >> 16);
459                 instr_out(data, hw_offset, 3, "dst (%d,%d)\n",
460                           data[3] & 0xffff, data[3] >> 16);
461                 instr_out(data, hw_offset, 4, "dst offset 0x%08x\n", data[4]);
462                 instr_out(data, hw_offset, 5, "src (%d,%d)\n",
463                           data[5] & 0xffff, data[5] >> 16);
464                 instr_out(data, hw_offset, 6, "src pitch %d\n",
465                           (short)(data[6] & 0xffff));
466                 instr_out(data, hw_offset, 7, "src offset 0x%08x\n", data[7]);
467                 return len;
468         }
469
470         for (opcode = 0; opcode < sizeof(opcodes_2d) / sizeof(opcodes_2d[0]);
471              opcode++) {
472                 if ((data[0] & 0x1fc00000) >> 22 == opcodes_2d[opcode].opcode) {
473                         unsigned int i;
474
475                         len = 1;
476                         instr_out(data, hw_offset, 0, "%s\n",
477                                   opcodes_2d[opcode].name);
478                         if (opcodes_2d[opcode].max_len > 1) {
479                                 len = (data[0] & 0x000000ff) + 2;
480                                 if (len < opcodes_2d[opcode].min_len ||
481                                     len > opcodes_2d[opcode].max_len) {
482                                         fprintf(out, "Bad count in %s\n",
483                                                 opcodes_2d[opcode].name);
484                                 }
485                         }
486
487                         for (i = 1; i < len; i++) {
488                                 if (i >= count)
489                                         BUFFER_FAIL(count, len,
490                                                     opcodes_2d[opcode].name);
491                                 instr_out(data, hw_offset, i, "dword %d\n", i);
492                         }
493
494                         return len;
495                 }
496         }
497
498         instr_out(data, hw_offset, 0, "2D UNKNOWN\n");
499         return 1;
500 }
501
502 static int
503 decode_3d_1c(struct drm_intel_decode *ctx)
504 {
505         uint32_t *data = ctx->data;
506         uint32_t hw_offset = ctx->hw_offset;
507         uint32_t opcode;
508
509         opcode = (data[0] & 0x00f80000) >> 19;
510
511         switch (opcode) {
512         case 0x11:
513                 instr_out(data, hw_offset, 0,
514                           "3DSTATE_DEPTH_SUBRECTANGLE_DISABLE\n");
515                 return 1;
516         case 0x10:
517                 instr_out(data, hw_offset, 0, "3DSTATE_SCISSOR_ENABLE %s\n",
518                           data[0] & 1 ? "enabled" : "disabled");
519                 return 1;
520         case 0x01:
521                 instr_out(data, hw_offset, 0, "3DSTATE_MAP_COORD_SET_I830\n");
522                 return 1;
523         case 0x0a:
524                 instr_out(data, hw_offset, 0, "3DSTATE_MAP_CUBE_I830\n");
525                 return 1;
526         case 0x05:
527                 instr_out(data, hw_offset, 0, "3DSTATE_MAP_TEX_STREAM_I830\n");
528                 return 1;
529         }
530
531         instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_1c opcode = 0x%x\n",
532                   opcode);
533         return 1;
534 }
535
536 /** Sets the string dstname to describe the destination of the PS instruction */
537 static void
538 i915_get_instruction_dst(uint32_t *data, int i, char *dstname, int do_mask)
539 {
540         uint32_t a0 = data[i];
541         int dst_nr = (a0 >> 14) & 0xf;
542         char dstmask[8];
543         const char *sat;
544
545         if (do_mask) {
546                 if (((a0 >> 10) & 0xf) == 0xf) {
547                         dstmask[0] = 0;
548                 } else {
549                         int dstmask_index = 0;
550
551                         dstmask[dstmask_index++] = '.';
552                         if (a0 & (1 << 10))
553                                 dstmask[dstmask_index++] = 'x';
554                         if (a0 & (1 << 11))
555                                 dstmask[dstmask_index++] = 'y';
556                         if (a0 & (1 << 12))
557                                 dstmask[dstmask_index++] = 'z';
558                         if (a0 & (1 << 13))
559                                 dstmask[dstmask_index++] = 'w';
560                         dstmask[dstmask_index++] = 0;
561                 }
562
563                 if (a0 & (1 << 22))
564                         sat = ".sat";
565                 else
566                         sat = "";
567         } else {
568                 dstmask[0] = 0;
569                 sat = "";
570         }
571
572         switch ((a0 >> 19) & 0x7) {
573         case 0:
574                 if (dst_nr > 15)
575                         fprintf(out, "bad destination reg R%d\n", dst_nr);
576                 sprintf(dstname, "R%d%s%s", dst_nr, dstmask, sat);
577                 break;
578         case 4:
579                 if (dst_nr > 0)
580                         fprintf(out, "bad destination reg oC%d\n", dst_nr);
581                 sprintf(dstname, "oC%s%s", dstmask, sat);
582                 break;
583         case 5:
584                 if (dst_nr > 0)
585                         fprintf(out, "bad destination reg oD%d\n", dst_nr);
586                 sprintf(dstname, "oD%s%s", dstmask, sat);
587                 break;
588         case 6:
589                 if (dst_nr > 3)
590                         fprintf(out, "bad destination reg U%d\n", dst_nr);
591                 sprintf(dstname, "U%d%s%s", dst_nr, dstmask, sat);
592                 break;
593         default:
594                 sprintf(dstname, "RESERVED");
595                 break;
596         }
597 }
598
599 static const char *
600 i915_get_channel_swizzle(uint32_t select)
601 {
602         switch (select & 0x7) {
603         case 0:
604                 return (select & 8) ? "-x" : "x";
605         case 1:
606                 return (select & 8) ? "-y" : "y";
607         case 2:
608                 return (select & 8) ? "-z" : "z";
609         case 3:
610                 return (select & 8) ? "-w" : "w";
611         case 4:
612                 return (select & 8) ? "-0" : "0";
613         case 5:
614                 return (select & 8) ? "-1" : "1";
615         default:
616                 return (select & 8) ? "-bad" : "bad";
617         }
618 }
619
620 static void
621 i915_get_instruction_src_name(uint32_t src_type, uint32_t src_nr, char *name)
622 {
623         switch (src_type) {
624         case 0:
625                 sprintf(name, "R%d", src_nr);
626                 if (src_nr > 15)
627                         fprintf(out, "bad src reg %s\n", name);
628                 break;
629         case 1:
630                 if (src_nr < 8)
631                         sprintf(name, "T%d", src_nr);
632                 else if (src_nr == 8)
633                         sprintf(name, "DIFFUSE");
634                 else if (src_nr == 9)
635                         sprintf(name, "SPECULAR");
636                 else if (src_nr == 10)
637                         sprintf(name, "FOG");
638                 else {
639                         fprintf(out, "bad src reg T%d\n", src_nr);
640                         sprintf(name, "RESERVED");
641                 }
642                 break;
643         case 2:
644                 sprintf(name, "C%d", src_nr);
645                 if (src_nr > 31)
646                         fprintf(out, "bad src reg %s\n", name);
647                 break;
648         case 4:
649                 sprintf(name, "oC");
650                 if (src_nr > 0)
651                         fprintf(out, "bad src reg oC%d\n", src_nr);
652                 break;
653         case 5:
654                 sprintf(name, "oD");
655                 if (src_nr > 0)
656                         fprintf(out, "bad src reg oD%d\n", src_nr);
657                 break;
658         case 6:
659                 sprintf(name, "U%d", src_nr);
660                 if (src_nr > 3)
661                         fprintf(out, "bad src reg %s\n", name);
662                 break;
663         default:
664                 fprintf(out, "bad src reg type %d\n", src_type);
665                 sprintf(name, "RESERVED");
666                 break;
667         }
668 }
669
670 static void i915_get_instruction_src0(uint32_t *data, int i, char *srcname)
671 {
672         uint32_t a0 = data[i];
673         uint32_t a1 = data[i + 1];
674         int src_nr = (a0 >> 2) & 0x1f;
675         const char *swizzle_x = i915_get_channel_swizzle((a1 >> 28) & 0xf);
676         const char *swizzle_y = i915_get_channel_swizzle((a1 >> 24) & 0xf);
677         const char *swizzle_z = i915_get_channel_swizzle((a1 >> 20) & 0xf);
678         const char *swizzle_w = i915_get_channel_swizzle((a1 >> 16) & 0xf);
679         char swizzle[100];
680
681         i915_get_instruction_src_name((a0 >> 7) & 0x7, src_nr, srcname);
682         sprintf(swizzle, ".%s%s%s%s", swizzle_x, swizzle_y, swizzle_z,
683                 swizzle_w);
684         if (strcmp(swizzle, ".xyzw") != 0)
685                 strcat(srcname, swizzle);
686 }
687
688 static void i915_get_instruction_src1(uint32_t *data, int i, char *srcname)
689 {
690         uint32_t a1 = data[i + 1];
691         uint32_t a2 = data[i + 2];
692         int src_nr = (a1 >> 8) & 0x1f;
693         const char *swizzle_x = i915_get_channel_swizzle((a1 >> 4) & 0xf);
694         const char *swizzle_y = i915_get_channel_swizzle((a1 >> 0) & 0xf);
695         const char *swizzle_z = i915_get_channel_swizzle((a2 >> 28) & 0xf);
696         const char *swizzle_w = i915_get_channel_swizzle((a2 >> 24) & 0xf);
697         char swizzle[100];
698
699         i915_get_instruction_src_name((a1 >> 13) & 0x7, src_nr, srcname);
700         sprintf(swizzle, ".%s%s%s%s", swizzle_x, swizzle_y, swizzle_z,
701                 swizzle_w);
702         if (strcmp(swizzle, ".xyzw") != 0)
703                 strcat(srcname, swizzle);
704 }
705
706 static void i915_get_instruction_src2(uint32_t *data, int i, char *srcname)
707 {
708         uint32_t a2 = data[i + 2];
709         int src_nr = (a2 >> 16) & 0x1f;
710         const char *swizzle_x = i915_get_channel_swizzle((a2 >> 12) & 0xf);
711         const char *swizzle_y = i915_get_channel_swizzle((a2 >> 8) & 0xf);
712         const char *swizzle_z = i915_get_channel_swizzle((a2 >> 4) & 0xf);
713         const char *swizzle_w = i915_get_channel_swizzle((a2 >> 0) & 0xf);
714         char swizzle[100];
715
716         i915_get_instruction_src_name((a2 >> 21) & 0x7, src_nr, srcname);
717         sprintf(swizzle, ".%s%s%s%s", swizzle_x, swizzle_y, swizzle_z,
718                 swizzle_w);
719         if (strcmp(swizzle, ".xyzw") != 0)
720                 strcat(srcname, swizzle);
721 }
722
723 static void
724 i915_get_instruction_addr(uint32_t src_type, uint32_t src_nr, char *name)
725 {
726         switch (src_type) {
727         case 0:
728                 sprintf(name, "R%d", src_nr);
729                 if (src_nr > 15)
730                         fprintf(out, "bad src reg %s\n", name);
731                 break;
732         case 1:
733                 if (src_nr < 8)
734                         sprintf(name, "T%d", src_nr);
735                 else if (src_nr == 8)
736                         sprintf(name, "DIFFUSE");
737                 else if (src_nr == 9)
738                         sprintf(name, "SPECULAR");
739                 else if (src_nr == 10)
740                         sprintf(name, "FOG");
741                 else {
742                         fprintf(out, "bad src reg T%d\n", src_nr);
743                         sprintf(name, "RESERVED");
744                 }
745                 break;
746         case 4:
747                 sprintf(name, "oC");
748                 if (src_nr > 0)
749                         fprintf(out, "bad src reg oC%d\n", src_nr);
750                 break;
751         case 5:
752                 sprintf(name, "oD");
753                 if (src_nr > 0)
754                         fprintf(out, "bad src reg oD%d\n", src_nr);
755                 break;
756         default:
757                 fprintf(out, "bad src reg type %d\n", src_type);
758                 sprintf(name, "RESERVED");
759                 break;
760         }
761 }
762
763 static void
764 i915_decode_alu1(uint32_t *data, uint32_t hw_offset,
765                  int i, char *instr_prefix, const char *op_name)
766 {
767         char dst[100], src0[100];
768
769         i915_get_instruction_dst(data, i, dst, 1);
770         i915_get_instruction_src0(data, i, src0);
771
772         instr_out(data, hw_offset, i++, "%s: %s %s, %s\n", instr_prefix,
773                   op_name, dst, src0);
774         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
775         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
776 }
777
778 static void
779 i915_decode_alu2(uint32_t *data, uint32_t hw_offset,
780                  int i, char *instr_prefix, const char *op_name)
781 {
782         char dst[100], src0[100], src1[100];
783
784         i915_get_instruction_dst(data, i, dst, 1);
785         i915_get_instruction_src0(data, i, src0);
786         i915_get_instruction_src1(data, i, src1);
787
788         instr_out(data, hw_offset, i++, "%s: %s %s, %s, %s\n", instr_prefix,
789                   op_name, dst, src0, src1);
790         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
791         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
792 }
793
794 static void
795 i915_decode_alu3(uint32_t *data, uint32_t hw_offset,
796                  int i, char *instr_prefix, const char *op_name)
797 {
798         char dst[100], src0[100], src1[100], src2[100];
799
800         i915_get_instruction_dst(data, i, dst, 1);
801         i915_get_instruction_src0(data, i, src0);
802         i915_get_instruction_src1(data, i, src1);
803         i915_get_instruction_src2(data, i, src2);
804
805         instr_out(data, hw_offset, i++, "%s: %s %s, %s, %s, %s\n", instr_prefix,
806                   op_name, dst, src0, src1, src2);
807         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
808         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
809 }
810
811 static void
812 i915_decode_tex(uint32_t *data, uint32_t hw_offset, int i,
813                 const char *instr_prefix, const char *tex_name)
814 {
815         uint32_t t0 = data[i];
816         uint32_t t1 = data[i + 1];
817         char dst_name[100];
818         char addr_name[100];
819         int sampler_nr;
820
821         i915_get_instruction_dst(data, i, dst_name, 0);
822         i915_get_instruction_addr((t1 >> 24) & 0x7,
823                                   (t1 >> 17) & 0xf, addr_name);
824         sampler_nr = t0 & 0xf;
825
826         instr_out(data, hw_offset, i++, "%s: %s %s, S%d, %s\n", instr_prefix,
827                   tex_name, dst_name, sampler_nr, addr_name);
828         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
829         instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
830 }
831
832 static void
833 i915_decode_dcl(uint32_t *data, uint32_t hw_offset, int i, char *instr_prefix)
834 {
835         uint32_t d0 = data[i];
836         const char *sampletype;
837         int dcl_nr = (d0 >> 14) & 0xf;
838         const char *dcl_x = d0 & (1 << 10) ? "x" : "";
839         const char *dcl_y = d0 & (1 << 11) ? "y" : "";
840         const char *dcl_z = d0 & (1 << 12) ? "z" : "";
841         const char *dcl_w = d0 & (1 << 13) ? "w" : "";
842         char dcl_mask[10];
843
844         switch ((d0 >> 19) & 0x3) {
845         case 1:
846                 sprintf(dcl_mask, ".%s%s%s%s", dcl_x, dcl_y, dcl_z, dcl_w);
847                 if (strcmp(dcl_mask, ".") == 0)
848                         fprintf(out, "bad (empty) dcl mask\n");
849
850                 if (dcl_nr > 10)
851                         fprintf(out, "bad T%d dcl register number\n", dcl_nr);
852                 if (dcl_nr < 8) {
853                         if (strcmp(dcl_mask, ".x") != 0 &&
854                             strcmp(dcl_mask, ".xy") != 0 &&
855                             strcmp(dcl_mask, ".xz") != 0 &&
856                             strcmp(dcl_mask, ".w") != 0 &&
857                             strcmp(dcl_mask, ".xyzw") != 0) {
858                                 fprintf(out, "bad T%d.%s dcl mask\n", dcl_nr,
859                                         dcl_mask);
860                         }
861                         instr_out(data, hw_offset, i++, "%s: DCL T%d%s\n",
862                                   instr_prefix, dcl_nr, dcl_mask);
863                 } else {
864                         if (strcmp(dcl_mask, ".xz") == 0)
865                                 fprintf(out, "errataed bad dcl mask %s\n",
866                                         dcl_mask);
867                         else if (strcmp(dcl_mask, ".xw") == 0)
868                                 fprintf(out, "errataed bad dcl mask %s\n",
869                                         dcl_mask);
870                         else if (strcmp(dcl_mask, ".xzw") == 0)
871                                 fprintf(out, "errataed bad dcl mask %s\n",
872                                         dcl_mask);
873
874                         if (dcl_nr == 8) {
875                                 instr_out(data, hw_offset, i++,
876                                           "%s: DCL DIFFUSE%s\n", instr_prefix,
877                                           dcl_mask);
878                         } else if (dcl_nr == 9) {
879                                 instr_out(data, hw_offset, i++,
880                                           "%s: DCL SPECULAR%s\n", instr_prefix,
881                                           dcl_mask);
882                         } else if (dcl_nr == 10) {
883                                 instr_out(data, hw_offset, i++,
884                                           "%s: DCL FOG%s\n", instr_prefix,
885                                           dcl_mask);
886                         }
887                 }
888                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
889                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
890                 break;
891         case 3:
892                 switch ((d0 >> 22) & 0x3) {
893                 case 0:
894                         sampletype = "2D";
895                         break;
896                 case 1:
897                         sampletype = "CUBE";
898                         break;
899                 case 2:
900                         sampletype = "3D";
901                         break;
902                 default:
903                         sampletype = "RESERVED";
904                         break;
905                 }
906                 if (dcl_nr > 15)
907                         fprintf(out, "bad S%d dcl register number\n", dcl_nr);
908                 instr_out(data, hw_offset, i++, "%s: DCL S%d %s\n",
909                           instr_prefix, dcl_nr, sampletype);
910                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
911                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
912                 break;
913         default:
914                 instr_out(data, hw_offset, i++, "%s: DCL RESERVED%d\n",
915                           instr_prefix, dcl_nr);
916                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
917                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
918         }
919 }
920
921 static void
922 i915_decode_instruction(uint32_t *data, uint32_t hw_offset,
923                         int i, char *instr_prefix)
924 {
925         switch ((data[i] >> 24) & 0x1f) {
926         case 0x0:
927                 instr_out(data, hw_offset, i++, "%s: NOP\n", instr_prefix);
928                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
929                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
930                 break;
931         case 0x01:
932                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "ADD");
933                 break;
934         case 0x02:
935                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "MOV");
936                 break;
937         case 0x03:
938                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "MUL");
939                 break;
940         case 0x04:
941                 i915_decode_alu3(data, hw_offset, i, instr_prefix, "MAD");
942                 break;
943         case 0x05:
944                 i915_decode_alu3(data, hw_offset, i, instr_prefix, "DP2ADD");
945                 break;
946         case 0x06:
947                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "DP3");
948                 break;
949         case 0x07:
950                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "DP4");
951                 break;
952         case 0x08:
953                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "FRC");
954                 break;
955         case 0x09:
956                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "RCP");
957                 break;
958         case 0x0a:
959                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "RSQ");
960                 break;
961         case 0x0b:
962                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "EXP");
963                 break;
964         case 0x0c:
965                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "LOG");
966                 break;
967         case 0x0d:
968                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "CMP");
969                 break;
970         case 0x0e:
971                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "MIN");
972                 break;
973         case 0x0f:
974                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "MAX");
975                 break;
976         case 0x10:
977                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "FLR");
978                 break;
979         case 0x11:
980                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "MOD");
981                 break;
982         case 0x12:
983                 i915_decode_alu1(data, hw_offset, i, instr_prefix, "TRC");
984                 break;
985         case 0x13:
986                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "SGE");
987                 break;
988         case 0x14:
989                 i915_decode_alu2(data, hw_offset, i, instr_prefix, "SLT");
990                 break;
991         case 0x15:
992                 i915_decode_tex(data, hw_offset, i, instr_prefix, "TEXLD");
993                 break;
994         case 0x16:
995                 i915_decode_tex(data, hw_offset, i, instr_prefix, "TEXLDP");
996                 break;
997         case 0x17:
998                 i915_decode_tex(data, hw_offset, i, instr_prefix, "TEXLDB");
999                 break;
1000         case 0x19:
1001                 i915_decode_dcl(data, hw_offset, i, instr_prefix);
1002                 break;
1003         default:
1004                 instr_out(data, hw_offset, i++, "%s: unknown\n", instr_prefix);
1005                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
1006                 instr_out(data, hw_offset, i++, "%s\n", instr_prefix);
1007                 break;
1008         }
1009 }
1010
1011 static const char *
1012 decode_compare_func(uint32_t op)
1013 {
1014         switch (op & 0x7) {
1015         case 0:
1016                 return "always";
1017         case 1:
1018                 return "never";
1019         case 2:
1020                 return "less";
1021         case 3:
1022                 return "equal";
1023         case 4:
1024                 return "lequal";
1025         case 5:
1026                 return "greater";
1027         case 6:
1028                 return "notequal";
1029         case 7:
1030                 return "gequal";
1031         }
1032         return "";
1033 }
1034
1035 static const char *
1036 decode_stencil_op(uint32_t op)
1037 {
1038         switch (op & 0x7) {
1039         case 0:
1040                 return "keep";
1041         case 1:
1042                 return "zero";
1043         case 2:
1044                 return "replace";
1045         case 3:
1046                 return "incr_sat";
1047         case 4:
1048                 return "decr_sat";
1049         case 5:
1050                 return "greater";
1051         case 6:
1052                 return "incr";
1053         case 7:
1054                 return "decr";
1055         }
1056         return "";
1057 }
1058
1059 #if 0
1060 static const char *
1061 decode_logic_op(uint32_t op)
1062 {
1063         switch (op & 0xf) {
1064         case 0:
1065                 return "clear";
1066         case 1:
1067                 return "nor";
1068         case 2:
1069                 return "and_inv";
1070         case 3:
1071                 return "copy_inv";
1072         case 4:
1073                 return "and_rvrse";
1074         case 5:
1075                 return "inv";
1076         case 6:
1077                 return "xor";
1078         case 7:
1079                 return "nand";
1080         case 8:
1081                 return "and";
1082         case 9:
1083                 return "equiv";
1084         case 10:
1085                 return "noop";
1086         case 11:
1087                 return "or_inv";
1088         case 12:
1089                 return "copy";
1090         case 13:
1091                 return "or_rvrse";
1092         case 14:
1093                 return "or";
1094         case 15:
1095                 return "set";
1096         }
1097         return "";
1098 }
1099 #endif
1100
1101 static const char *
1102 decode_blend_fact(uint32_t op)
1103 {
1104         switch (op & 0xf) {
1105         case 1:
1106                 return "zero";
1107         case 2:
1108                 return "one";
1109         case 3:
1110                 return "src_colr";
1111         case 4:
1112                 return "inv_src_colr";
1113         case 5:
1114                 return "src_alpha";
1115         case 6:
1116                 return "inv_src_alpha";
1117         case 7:
1118                 return "dst_alpha";
1119         case 8:
1120                 return "inv_dst_alpha";
1121         case 9:
1122                 return "dst_colr";
1123         case 10:
1124                 return "inv_dst_colr";
1125         case 11:
1126                 return "src_alpha_sat";
1127         case 12:
1128                 return "cnst_colr";
1129         case 13:
1130                 return "inv_cnst_colr";
1131         case 14:
1132                 return "cnst_alpha";
1133         case 15:
1134                 return "inv_const_alpha";
1135         }
1136         return "";
1137 }
1138
1139 static const char *
1140 decode_tex_coord_mode(uint32_t mode)
1141 {
1142         switch (mode & 0x7) {
1143         case 0:
1144                 return "wrap";
1145         case 1:
1146                 return "mirror";
1147         case 2:
1148                 return "clamp_edge";
1149         case 3:
1150                 return "cube";
1151         case 4:
1152                 return "clamp_border";
1153         case 5:
1154                 return "mirror_once";
1155         }
1156         return "";
1157 }
1158
1159 static const char *
1160 decode_sample_filter(uint32_t mode)
1161 {
1162         switch (mode & 0x7) {
1163         case 0:
1164                 return "nearest";
1165         case 1:
1166                 return "linear";
1167         case 2:
1168                 return "anisotropic";
1169         case 3:
1170                 return "4x4_1";
1171         case 4:
1172                 return "4x4_2";
1173         case 5:
1174                 return "4x4_flat";
1175         case 6:
1176                 return "6x5_mono";
1177         }
1178         return "";
1179 }
1180
1181 static int
1182 decode_3d_1d(struct drm_intel_decode *ctx)
1183 {
1184         unsigned int len, i, c, idx, word, map, sampler, instr;
1185         const char *format, *zformat, *type;
1186         uint32_t opcode;
1187         uint32_t hw_offset = ctx->hw_offset;
1188         uint32_t *data = ctx->data;
1189         uint32_t count = ctx->count;
1190         uint32_t devid = ctx->devid;
1191
1192         struct {
1193                 uint32_t opcode;
1194                 int i830_only;
1195                 unsigned int min_len;
1196                 unsigned int max_len;
1197                 const char *name;
1198         } opcodes_3d_1d[] = {
1199                 { 0x86, 0, 4, 4, "3DSTATE_CHROMA_KEY" },
1200                 { 0x88, 0, 2, 2, "3DSTATE_CONSTANT_BLEND_COLOR" },
1201                 { 0x99, 0, 2, 2, "3DSTATE_DEFAULT_DIFFUSE" },
1202                 { 0x9a, 0, 2, 2, "3DSTATE_DEFAULT_SPECULAR" },
1203                 { 0x98, 0, 2, 2, "3DSTATE_DEFAULT_Z" },
1204                 { 0x97, 0, 2, 2, "3DSTATE_DEPTH_OFFSET_SCALE" },
1205                 { 0x9d, 0, 65, 65, "3DSTATE_FILTER_COEFFICIENTS_4X4" },
1206                 { 0x9e, 0, 4, 4, "3DSTATE_MONO_FILTER" },
1207                 { 0x89, 0, 4, 4, "3DSTATE_FOG_MODE" },
1208                 { 0x8f, 0, 2, 16, "3DSTATE_MAP_PALLETE_LOAD_32" },
1209                 { 0x83, 0, 2, 2, "3DSTATE_SPAN_STIPPLE" },
1210                 { 0x8c, 1, 2, 2, "3DSTATE_MAP_COORD_TRANSFORM_I830" },
1211                 { 0x8b, 1, 2, 2, "3DSTATE_MAP_VERTEX_TRANSFORM_I830" },
1212                 { 0x8d, 1, 3, 3, "3DSTATE_W_STATE_I830" },
1213                 { 0x01, 1, 2, 2, "3DSTATE_COLOR_FACTOR_I830" },
1214                 { 0x02, 1, 2, 2, "3DSTATE_MAP_COORD_SETBIND_I830"},
1215         }, *opcode_3d_1d;
1216
1217         opcode = (data[0] & 0x00ff0000) >> 16;
1218
1219         switch (opcode) {
1220         case 0x07:
1221                 /* This instruction is unusual.  A 0 length means just
1222                  * 1 DWORD instead of 2.  The 0 length is specified in
1223                  * one place to be unsupported, but stated to be
1224                  * required in another, and 0 length LOAD_INDIRECTs
1225                  * appear to cause no harm at least.
1226                  */
1227                 instr_out(data, hw_offset, 0, "3DSTATE_LOAD_INDIRECT\n");
1228                 len = (data[0] & 0x000000ff) + 1;
1229                 i = 1;
1230                 if (data[0] & (0x01 << 8)) {
1231                         if (i + 2 >= count)
1232                                 BUFFER_FAIL(count, len,
1233                                             "3DSTATE_LOAD_INDIRECT");
1234                         instr_out(data, hw_offset, i++, "SIS.0\n");
1235                         instr_out(data, hw_offset, i++, "SIS.1\n");
1236                 }
1237                 if (data[0] & (0x02 << 8)) {
1238                         if (i + 1 >= count)
1239                                 BUFFER_FAIL(count, len,
1240                                             "3DSTATE_LOAD_INDIRECT");
1241                         instr_out(data, hw_offset, i++, "DIS.0\n");
1242                 }
1243                 if (data[0] & (0x04 << 8)) {
1244                         if (i + 2 >= count)
1245                                 BUFFER_FAIL(count, len,
1246                                             "3DSTATE_LOAD_INDIRECT");
1247                         instr_out(data, hw_offset, i++, "SSB.0\n");
1248                         instr_out(data, hw_offset, i++, "SSB.1\n");
1249                 }
1250                 if (data[0] & (0x08 << 8)) {
1251                         if (i + 2 >= count)
1252                                 BUFFER_FAIL(count, len,
1253                                             "3DSTATE_LOAD_INDIRECT");
1254                         instr_out(data, hw_offset, i++, "MSB.0\n");
1255                         instr_out(data, hw_offset, i++, "MSB.1\n");
1256                 }
1257                 if (data[0] & (0x10 << 8)) {
1258                         if (i + 2 >= count)
1259                                 BUFFER_FAIL(count, len,
1260                                             "3DSTATE_LOAD_INDIRECT");
1261                         instr_out(data, hw_offset, i++, "PSP.0\n");
1262                         instr_out(data, hw_offset, i++, "PSP.1\n");
1263                 }
1264                 if (data[0] & (0x20 << 8)) {
1265                         if (i + 2 >= count)
1266                                 BUFFER_FAIL(count, len,
1267                                             "3DSTATE_LOAD_INDIRECT");
1268                         instr_out(data, hw_offset, i++, "PSC.0\n");
1269                         instr_out(data, hw_offset, i++, "PSC.1\n");
1270                 }
1271                 if (len != i) {
1272                         fprintf(out, "Bad count in 3DSTATE_LOAD_INDIRECT\n");
1273                         return len;
1274                 }
1275                 return len;
1276         case 0x04:
1277                 instr_out(data, hw_offset, 0,
1278                           "3DSTATE_LOAD_STATE_IMMEDIATE_1\n");
1279                 len = (data[0] & 0x0000000f) + 2;
1280                 i = 1;
1281                 for (word = 0; word <= 8; word++) {
1282                         if (data[0] & (1 << (4 + word))) {
1283                                 if (i >= count)
1284                                         BUFFER_FAIL(count, len,
1285                                                     "3DSTATE_LOAD_STATE_IMMEDIATE_1");
1286
1287                                 /* save vertex state for decode */
1288                                 if (!IS_GEN2(devid)) {
1289                                         int tex_num;
1290
1291                                         if (word == 2) {
1292                                                 saved_s2_set = 1;
1293                                                 saved_s2 = data[i];
1294                                         }
1295                                         if (word == 4) {
1296                                                 saved_s4_set = 1;
1297                                                 saved_s4 = data[i];
1298                                         }
1299
1300                                         switch (word) {
1301                                         case 0:
1302                                                 instr_out(data, hw_offset, i,
1303                                                           "S0: vbo offset: 0x%08x%s\n",
1304                                                           data[i] & (~1),
1305                                                           data[i] & 1 ?
1306                                                           ", auto cache invalidate disabled"
1307                                                           : "");
1308                                                 break;
1309                                         case 1:
1310                                                 instr_out(data, hw_offset, i,
1311                                                           "S1: vertex width: %i, vertex pitch: %i\n",
1312                                                           (data[i] >> 24) &
1313                                                           0x3f,
1314                                                           (data[i] >> 16) &
1315                                                           0x3f);
1316                                                 break;
1317                                         case 2:
1318                                                 instr_out(data, hw_offset, i,
1319                                                           "S2: texcoord formats: ");
1320                                                 for (tex_num = 0;
1321                                                      tex_num < 8; tex_num++) {
1322                                                         switch ((data[i] >>
1323                                                                  tex_num *
1324                                                                  4) & 0xf) {
1325                                                         case 0:
1326                                                                 fprintf(out,
1327                                                                         "%i=2D ",
1328                                                                         tex_num);
1329                                                                 break;
1330                                                         case 1:
1331                                                                 fprintf(out,
1332                                                                         "%i=3D ",
1333                                                                         tex_num);
1334                                                                 break;
1335                                                         case 2:
1336                                                                 fprintf(out,
1337                                                                         "%i=4D ",
1338                                                                         tex_num);
1339                                                                 break;
1340                                                         case 3:
1341                                                                 fprintf(out,
1342                                                                         "%i=1D ",
1343                                                                         tex_num);
1344                                                                 break;
1345                                                         case 4:
1346                                                                 fprintf(out,
1347                                                                         "%i=2D_16 ",
1348                                                                         tex_num);
1349                                                                 break;
1350                                                         case 5:
1351                                                                 fprintf(out,
1352                                                                         "%i=4D_16 ",
1353                                                                         tex_num);
1354                                                                 break;
1355                                                         case 0xf:
1356                                                                 fprintf(out,
1357                                                                         "%i=NP ",
1358                                                                         tex_num);
1359                                                                 break;
1360                                                         }
1361                                                 }
1362                                                 fprintf(out, "\n");
1363
1364                                                 break;
1365                                         case 3:
1366                                                 instr_out(data, hw_offset, i,
1367                                                           "S3: not documented\n");
1368                                                 break;
1369                                         case 4:
1370                                                 {
1371                                                         const char *cullmode = "";
1372                                                         const char *vfmt_xyzw = "";
1373                                                         switch ((data[i] >> 13)
1374                                                                 & 0x3) {
1375                                                         case 0:
1376                                                                 cullmode =
1377                                                                     "both";
1378                                                                 break;
1379                                                         case 1:
1380                                                                 cullmode =
1381                                                                     "none";
1382                                                                 break;
1383                                                         case 2:
1384                                                                 cullmode = "cw";
1385                                                                 break;
1386                                                         case 3:
1387                                                                 cullmode =
1388                                                                     "ccw";
1389                                                                 break;
1390                                                         }
1391                                                         switch (data[i] &
1392                                                                 (7 << 6 | 1 <<
1393                                                                  2)) {
1394                                                         case 1 << 6:
1395                                                                 vfmt_xyzw =
1396                                                                     "XYZ,";
1397                                                                 break;
1398                                                         case 2 << 6:
1399                                                                 vfmt_xyzw =
1400                                                                     "XYZW,";
1401                                                                 break;
1402                                                         case 3 << 6:
1403                                                                 vfmt_xyzw =
1404                                                                     "XY,";
1405                                                                 break;
1406                                                         case 4 << 6:
1407                                                                 vfmt_xyzw =
1408                                                                     "XYW,";
1409                                                                 break;
1410                                                         case 1 << 6 | 1 << 2:
1411                                                                 vfmt_xyzw =
1412                                                                     "XYZF,";
1413                                                                 break;
1414                                                         case 2 << 6 | 1 << 2:
1415                                                                 vfmt_xyzw =
1416                                                                     "XYZWF,";
1417                                                                 break;
1418                                                         case 3 << 6 | 1 << 2:
1419                                                                 vfmt_xyzw =
1420                                                                     "XYF,";
1421                                                                 break;
1422                                                         case 4 << 6 | 1 << 2:
1423                                                                 vfmt_xyzw =
1424                                                                     "XYWF,";
1425                                                                 break;
1426                                                         }
1427                                                         instr_out(data,
1428                                                                   hw_offset, i,
1429                                                                   "S4: point_width=%i, line_width=%.1f,"
1430                                                                   "%s%s%s%s%s cullmode=%s, vfmt=%s%s%s%s%s%s "
1431                                                                   "%s%s%s%s%s\n",
1432                                                                   (data[i] >>
1433                                                                    23) & 0x1ff,
1434                                                                   ((data[i] >>
1435                                                                     19) & 0xf) /
1436                                                                   2.0,
1437                                                                   data[i] & (0xf
1438                                                                              <<
1439                                                                              15)
1440                                                                   ?
1441                                                                   " flatshade="
1442                                                                   : "",
1443                                                                   data[i] & (1
1444                                                                              <<
1445                                                                              18)
1446                                                                   ? "Alpha," :
1447                                                                   "",
1448                                                                   data[i] & (1
1449                                                                              <<
1450                                                                              17)
1451                                                                   ? "Fog," : "",
1452                                                                   data[i] & (1
1453                                                                              <<
1454                                                                              16)
1455                                                                   ? "Specular,"
1456                                                                   : "",
1457                                                                   data[i] & (1
1458                                                                              <<
1459                                                                              15)
1460                                                                   ? "Color," :
1461                                                                   "", cullmode,
1462                                                                   data[i] & (1
1463                                                                              <<
1464                                                                              12)
1465                                                                   ?
1466                                                                   "PointWidth,"
1467                                                                   : "",
1468                                                                   data[i] & (1
1469                                                                              <<
1470                                                                              11)
1471                                                                   ? "SpecFog," :
1472                                                                   "",
1473                                                                   data[i] & (1
1474                                                                              <<
1475                                                                              10)
1476                                                                   ? "Color," :
1477                                                                   "",
1478                                                                   data[i] & (1
1479                                                                              <<
1480                                                                              9)
1481                                                                   ? "DepthOfs,"
1482                                                                   : "",
1483                                                                   vfmt_xyzw,
1484                                                                   data[i] & (1
1485                                                                              <<
1486                                                                              9)
1487                                                                   ? "FogParam,"
1488                                                                   : "",
1489                                                                   data[i] & (1
1490                                                                              <<
1491                                                                              5)
1492                                                                   ?
1493                                                                   "force default diffuse, "
1494                                                                   : "",
1495                                                                   data[i] & (1
1496                                                                              <<
1497                                                                              4)
1498                                                                   ?
1499                                                                   "force default specular, "
1500                                                                   : "",
1501                                                                   data[i] & (1
1502                                                                              <<
1503                                                                              3)
1504                                                                   ?
1505                                                                   "local depth ofs enable, "
1506                                                                   : "",
1507                                                                   data[i] & (1
1508                                                                              <<
1509                                                                              1)
1510                                                                   ?
1511                                                                   "point sprite enable, "
1512                                                                   : "",
1513                                                                   data[i] & (1
1514                                                                              <<
1515                                                                              0)
1516                                                                   ?
1517                                                                   "line AA enable, "
1518                                                                   : "");
1519                                                         break;
1520                                                 }
1521                                         case 5:
1522                                                 {
1523                                                         instr_out(data,
1524                                                                   hw_offset, i,
1525                                                                   "S5:%s%s%s%s%s"
1526                                                                   "%s%s%s%s stencil_ref=0x%x, stencil_test=%s, "
1527                                                                   "stencil_fail=%s, stencil_pass_z_fail=%s, "
1528                                                                   "stencil_pass_z_pass=%s, %s%s%s%s\n",
1529                                                                   data[i] & (0xf
1530                                                                              <<
1531                                                                              28)
1532                                                                   ?
1533                                                                   " write_disable="
1534                                                                   : "",
1535                                                                   data[i] & (1
1536                                                                              <<
1537                                                                              31)
1538                                                                   ? "Alpha," :
1539                                                                   "",
1540                                                                   data[i] & (1
1541                                                                              <<
1542                                                                              30)
1543                                                                   ? "Red," : "",
1544                                                                   data[i] & (1
1545                                                                              <<
1546                                                                              29)
1547                                                                   ? "Green," :
1548                                                                   "",
1549                                                                   data[i] & (1
1550                                                                              <<
1551                                                                              28)
1552                                                                   ? "Blue," :
1553                                                                   "",
1554                                                                   data[i] & (1
1555                                                                              <<
1556                                                                              27)
1557                                                                   ?
1558                                                                   " force default point size,"
1559                                                                   : "",
1560                                                                   data[i] & (1
1561                                                                              <<
1562                                                                              26)
1563                                                                   ?
1564                                                                   " last pixel enable,"
1565                                                                   : "",
1566                                                                   data[i] & (1
1567                                                                              <<
1568                                                                              25)
1569                                                                   ?
1570                                                                   " global depth ofs enable,"
1571                                                                   : "",
1572                                                                   data[i] & (1
1573                                                                              <<
1574                                                                              24)
1575                                                                   ?
1576                                                                   " fog enable,"
1577                                                                   : "",
1578                                                                   (data[i] >>
1579                                                                    16) & 0xff,
1580                                                                   decode_compare_func
1581                                                                   (data[i] >>
1582                                                                    13),
1583                                                                   decode_stencil_op
1584                                                                   (data[i] >>
1585                                                                    10),
1586                                                                   decode_stencil_op
1587                                                                   (data[i] >>
1588                                                                    7),
1589                                                                   decode_stencil_op
1590                                                                   (data[i] >>
1591                                                                    4),
1592                                                                   data[i] & (1
1593                                                                              <<
1594                                                                              3)
1595                                                                   ?
1596                                                                   "stencil write enable, "
1597                                                                   : "",
1598                                                                   data[i] & (1
1599                                                                              <<
1600                                                                              2)
1601                                                                   ?
1602                                                                   "stencil test enable, "
1603                                                                   : "",
1604                                                                   data[i] & (1
1605                                                                              <<
1606                                                                              1)
1607                                                                   ?
1608                                                                   "color dither enable, "
1609                                                                   : "",
1610                                                                   data[i] & (1
1611                                                                              <<
1612                                                                              0)
1613                                                                   ?
1614                                                                   "logicop enable, "
1615                                                                   : "");
1616                                                 }
1617                                                 break;
1618                                         case 6:
1619                                                 instr_out(data, hw_offset, i,
1620                                                           "S6: %salpha_test=%s, alpha_ref=0x%x, "
1621                                                           "depth_test=%s, %ssrc_blnd_fct=%s, dst_blnd_fct=%s, "
1622                                                           "%s%stristrip_provoking_vertex=%i\n",
1623                                                           data[i] & (1 << 31) ?
1624                                                           "alpha test enable, "
1625                                                           : "",
1626                                                           decode_compare_func
1627                                                           (data[i] >> 28),
1628                                                           data[i] & (0xff <<
1629                                                                      20),
1630                                                           decode_compare_func
1631                                                           (data[i] >> 16),
1632                                                           data[i] & (1 << 15) ?
1633                                                           "cbuf blend enable, "
1634                                                           : "",
1635                                                           decode_blend_fact(data
1636                                                                             [i]
1637                                                                             >>
1638                                                                             8),
1639                                                           decode_blend_fact(data
1640                                                                             [i]
1641                                                                             >>
1642                                                                             4),
1643                                                           data[i] & (1 << 3) ?
1644                                                           "depth write enable, "
1645                                                           : "",
1646                                                           data[i] & (1 << 2) ?
1647                                                           "cbuf write enable, "
1648                                                           : "",
1649                                                           data[i] & (0x3));
1650                                                 break;
1651                                         case 7:
1652                                                 instr_out(data, hw_offset, i,
1653                                                           "S7: depth offset constant: 0x%08x\n",
1654                                                           data[i]);
1655                                                 break;
1656                                         }
1657                                 } else {
1658                                         instr_out(data, hw_offset, i,
1659                                                   "S%d: 0x%08x\n", i, data[i]);
1660                                 }
1661                                 i++;
1662                         }
1663                 }
1664                 if (len != i) {
1665                         fprintf(out,
1666                                 "Bad count in 3DSTATE_LOAD_STATE_IMMEDIATE_1\n");
1667                 }
1668                 return len;
1669         case 0x03:
1670                 instr_out(data, hw_offset, 0,
1671                           "3DSTATE_LOAD_STATE_IMMEDIATE_2\n");
1672                 len = (data[0] & 0x0000000f) + 2;
1673                 i = 1;
1674                 for (word = 6; word <= 14; word++) {
1675                         if (data[0] & (1 << word)) {
1676                                 if (i >= count)
1677                                         BUFFER_FAIL(count, len,
1678                                                     "3DSTATE_LOAD_STATE_IMMEDIATE_2");
1679
1680                                 if (word == 6)
1681                                         instr_out(data, hw_offset, i++,
1682                                                   "TBCF\n");
1683                                 else if (word >= 7 && word <= 10) {
1684                                         instr_out(data, hw_offset, i++,
1685                                                   "TB%dC\n", word - 7);
1686                                         instr_out(data, hw_offset, i++,
1687                                                   "TB%dA\n", word - 7);
1688                                 } else if (word >= 11 && word <= 14) {
1689                                         instr_out(data, hw_offset, i,
1690                                                   "TM%dS0: offset=0x%08x, %s\n",
1691                                                   word - 11,
1692                                                   data[i] & 0xfffffffe,
1693                                                   data[i] & 1 ? "use fence" :
1694                                                   "");
1695                                         i++;
1696                                         instr_out(data, hw_offset, i,
1697                                                   "TM%dS1: height=%i, width=%i, %s\n",
1698                                                   word - 11, data[i] >> 21,
1699                                                   (data[i] >> 10) & 0x3ff,
1700                                                   data[i] & 2 ? (data[i] & 1 ?
1701                                                                  "y-tiled" :
1702                                                                  "x-tiled") :
1703                                                   "");
1704                                         i++;
1705                                         instr_out(data, hw_offset, i,
1706                                                   "TM%dS2: pitch=%i, \n",
1707                                                   word - 11,
1708                                                   ((data[i] >> 21) + 1) * 4);
1709                                         i++;
1710                                         instr_out(data, hw_offset, i++,
1711                                                   "TM%dS3\n", word - 11);
1712                                         instr_out(data, hw_offset, i++,
1713                                                   "TM%dS4: dflt color\n",
1714                                                   word - 11);
1715                                 }
1716                         }
1717                 }
1718                 if (len != i) {
1719                         fprintf(out,
1720                                 "Bad count in 3DSTATE_LOAD_STATE_IMMEDIATE_2\n");
1721                 }
1722                 return len;
1723         case 0x00:
1724                 instr_out(data, hw_offset, 0, "3DSTATE_MAP_STATE\n");
1725                 len = (data[0] & 0x0000003f) + 2;
1726                 instr_out(data, hw_offset, 1, "mask\n");
1727
1728                 i = 2;
1729                 for (map = 0; map <= 15; map++) {
1730                         if (data[1] & (1 << map)) {
1731                                 int width, height, pitch, dword;
1732                                 const char *tiling;
1733
1734                                 if (i + 3 >= count)
1735                                         BUFFER_FAIL(count, len,
1736                                                     "3DSTATE_MAP_STATE");
1737
1738                                 dword = data[i];
1739                                 instr_out(data, hw_offset, i++,
1740                                           "map %d MS2 %s%s%s\n", map,
1741                                           dword & (1 << 31) ?
1742                                           "untrusted surface, " : "",
1743                                           dword & (1 << 1) ?
1744                                           "vertical line stride enable, " : "",
1745                                           dword & (1 << 0) ?
1746                                           "vertical ofs enable, " : "");
1747
1748                                 dword = data[i];
1749                                 width = ((dword >> 10) & ((1 << 11) - 1)) + 1;
1750                                 height = ((dword >> 21) & ((1 << 11) - 1)) + 1;
1751
1752                                 tiling = "none";
1753                                 if (dword & (1 << 2))
1754                                         tiling = "fenced";
1755                                 else if (dword & (1 << 1))
1756                                         tiling = dword & (1 << 0) ? "Y" : "X";
1757                                 type = " BAD";
1758                                 format = "BAD";
1759                                 switch ((dword >> 7) & 0x7) {
1760                                 case 1:
1761                                         type = "8b";
1762                                         switch ((dword >> 3) & 0xf) {
1763                                         case 0:
1764                                                 format = "I";
1765                                                 break;
1766                                         case 1:
1767                                                 format = "L";
1768                                                 break;
1769                                         case 4:
1770                                                 format = "A";
1771                                                 break;
1772                                         case 5:
1773                                                 format = " mono";
1774                                                 break;
1775                                         }
1776                                         break;
1777                                 case 2:
1778                                         type = "16b";
1779                                         switch ((dword >> 3) & 0xf) {
1780                                         case 0:
1781                                                 format = " rgb565";
1782                                                 break;
1783                                         case 1:
1784                                                 format = " argb1555";
1785                                                 break;
1786                                         case 2:
1787                                                 format = " argb4444";
1788                                                 break;
1789                                         case 5:
1790                                                 format = " ay88";
1791                                                 break;
1792                                         case 6:
1793                                                 format = " bump655";
1794                                                 break;
1795                                         case 7:
1796                                                 format = "I";
1797                                                 break;
1798                                         case 8:
1799                                                 format = "L";
1800                                                 break;
1801                                         case 9:
1802                                                 format = "A";
1803                                                 break;
1804                                         }
1805                                         break;
1806                                 case 3:
1807                                         type = "32b";
1808                                         switch ((dword >> 3) & 0xf) {
1809                                         case 0:
1810                                                 format = " argb8888";
1811                                                 break;
1812                                         case 1:
1813                                                 format = " abgr8888";
1814                                                 break;
1815                                         case 2:
1816                                                 format = " xrgb8888";
1817                                                 break;
1818                                         case 3:
1819                                                 format = " xbgr8888";
1820                                                 break;
1821                                         case 4:
1822                                                 format = " qwvu8888";
1823                                                 break;
1824                                         case 5:
1825                                                 format = " axvu8888";
1826                                                 break;
1827                                         case 6:
1828                                                 format = " lxvu8888";
1829                                                 break;
1830                                         case 7:
1831                                                 format = " xlvu8888";
1832                                                 break;
1833                                         case 8:
1834                                                 format = " argb2101010";
1835                                                 break;
1836                                         case 9:
1837                                                 format = " abgr2101010";
1838                                                 break;
1839                                         case 10:
1840                                                 format = " awvu2101010";
1841                                                 break;
1842                                         case 11:
1843                                                 format = " gr1616";
1844                                                 break;
1845                                         case 12:
1846                                                 format = " vu1616";
1847                                                 break;
1848                                         case 13:
1849                                                 format = " xI824";
1850                                                 break;
1851                                         case 14:
1852                                                 format = " xA824";
1853                                                 break;
1854                                         case 15:
1855                                                 format = " xL824";
1856                                                 break;
1857                                         }
1858                                         break;
1859                                 case 5:
1860                                         type = "422";
1861                                         switch ((dword >> 3) & 0xf) {
1862                                         case 0:
1863                                                 format = " yuv_swapy";
1864                                                 break;
1865                                         case 1:
1866                                                 format = " yuv";
1867                                                 break;
1868                                         case 2:
1869                                                 format = " yuv_swapuv";
1870                                                 break;
1871                                         case 3:
1872                                                 format = " yuv_swapuvy";
1873                                                 break;
1874                                         }
1875                                         break;
1876                                 case 6:
1877                                         type = "compressed";
1878                                         switch ((dword >> 3) & 0x7) {
1879                                         case 0:
1880                                                 format = " dxt1";
1881                                                 break;
1882                                         case 1:
1883                                                 format = " dxt2_3";
1884                                                 break;
1885                                         case 2:
1886                                                 format = " dxt4_5";
1887                                                 break;
1888                                         case 3:
1889                                                 format = " fxt1";
1890                                                 break;
1891                                         case 4:
1892                                                 format = " dxt1_rb";
1893                                                 break;
1894                                         }
1895                                         break;
1896                                 case 7:
1897                                         type = "4b indexed";
1898                                         switch ((dword >> 3) & 0xf) {
1899                                         case 7:
1900                                                 format = " argb8888";
1901                                                 break;
1902                                         }
1903                                         break;
1904                                 }
1905                                 dword = data[i];
1906                                 instr_out(data, hw_offset, i++,
1907                                           "map %d MS3 [width=%d, height=%d, format=%s%s, tiling=%s%s]\n",
1908                                           map, width, height, type, format,
1909                                           tiling,
1910                                           dword & (1 << 9) ? " palette select" :
1911                                           "");
1912
1913                                 dword = data[i];
1914                                 pitch =
1915                                     4 * (((dword >> 21) & ((1 << 11) - 1)) + 1);
1916                                 instr_out(data, hw_offset, i++,
1917                                           "map %d MS4 [pitch=%d, max_lod=%i, vol_depth=%i, cube_face_ena=%x, %s]\n",
1918                                           map, pitch, (dword >> 9) & 0x3f,
1919                                           dword & 0xff, (dword >> 15) & 0x3f,
1920                                           dword & (1 << 8) ? "miplayout legacy"
1921                                           : "miplayout right");
1922                         }
1923                 }
1924                 if (len != i) {
1925                         fprintf(out, "Bad count in 3DSTATE_MAP_STATE\n");
1926                         return len;
1927                 }
1928                 return len;
1929         case 0x06:
1930                 instr_out(data, hw_offset, 0,
1931                           "3DSTATE_PIXEL_SHADER_CONSTANTS\n");
1932                 len = (data[0] & 0x000000ff) + 2;
1933
1934                 i = 2;
1935                 for (c = 0; c <= 31; c++) {
1936                         if (data[1] & (1 << c)) {
1937                                 if (i + 4 >= count)
1938                                         BUFFER_FAIL(count, len,
1939                                                     "3DSTATE_PIXEL_SHADER_CONSTANTS");
1940                                 instr_out(data, hw_offset, i, "C%d.X = %f\n", c,
1941                                           int_as_float(data[i]));
1942                                 i++;
1943                                 instr_out(data, hw_offset, i, "C%d.Y = %f\n",
1944                                           c, int_as_float(data[i]));
1945                                 i++;
1946                                 instr_out(data, hw_offset, i, "C%d.Z = %f\n",
1947                                           c, int_as_float(data[i]));
1948                                 i++;
1949                                 instr_out(data, hw_offset, i, "C%d.W = %f\n",
1950                                           c, int_as_float(data[i]));
1951                                 i++;
1952                         }
1953                 }
1954                 if (len != i) {
1955                         fprintf(out,
1956                                 "Bad count in 3DSTATE_PIXEL_SHADER_CONSTANTS\n");
1957                 }
1958                 return len;
1959         case 0x05:
1960                 instr_out(data, hw_offset, 0, "3DSTATE_PIXEL_SHADER_PROGRAM\n");
1961                 len = (data[0] & 0x000000ff) + 2;
1962                 if ((len - 1) % 3 != 0 || len > 370) {
1963                         fprintf(out,
1964                                 "Bad count in 3DSTATE_PIXEL_SHADER_PROGRAM\n");
1965                 }
1966                 i = 1;
1967                 for (instr = 0; instr < (len - 1) / 3; instr++) {
1968                         char instr_prefix[10];
1969
1970                         if (i + 3 >= count)
1971                                 BUFFER_FAIL(count, len,
1972                                             "3DSTATE_PIXEL_SHADER_PROGRAM");
1973                         sprintf(instr_prefix, "PS%03d", instr);
1974                         i915_decode_instruction(data, hw_offset, i,
1975                                                 instr_prefix);
1976                         i += 3;
1977                 }
1978                 return len;
1979         case 0x01:
1980                 if (IS_GEN2(devid))
1981                         break;
1982                 instr_out(data, hw_offset, 0, "3DSTATE_SAMPLER_STATE\n");
1983                 instr_out(data, hw_offset, 1, "mask\n");
1984                 len = (data[0] & 0x0000003f) + 2;
1985                 i = 2;
1986                 for (sampler = 0; sampler <= 15; sampler++) {
1987                         if (data[1] & (1 << sampler)) {
1988                                 uint32_t dword;
1989                                 const char *mip_filter = "";
1990                                 if (i + 3 >= count)
1991                                         BUFFER_FAIL(count, len,
1992                                                     "3DSTATE_SAMPLER_STATE");
1993                                 dword = data[i];
1994                                 switch ((dword >> 20) & 0x3) {
1995                                 case 0:
1996                                         mip_filter = "none";
1997                                         break;
1998                                 case 1:
1999                                         mip_filter = "nearest";
2000                                         break;
2001                                 case 3:
2002                                         mip_filter = "linear";
2003                                         break;
2004                                 }
2005                                 instr_out(data, hw_offset, i++,
2006                                           "sampler %d SS2:%s%s%s "
2007                                           "base_mip_level=%i, mip_filter=%s, mag_filter=%s, min_filter=%s "
2008                                           "lod_bias=%.2f,%s max_aniso=%i, shadow_func=%s\n",
2009                                           sampler,
2010                                           dword & (1 << 31) ? " reverse gamma,"
2011                                           : "",
2012                                           dword & (1 << 30) ? " packed2planar,"
2013                                           : "",
2014                                           dword & (1 << 29) ?
2015                                           " colorspace conversion," : "",
2016                                           (dword >> 22) & 0x1f, mip_filter,
2017                                           decode_sample_filter(dword >> 17),
2018                                           decode_sample_filter(dword >> 14),
2019                                           ((dword >> 5) & 0x1ff) / (0x10 * 1.0),
2020                                           dword & (1 << 4) ? " shadow," : "",
2021                                           dword & (1 << 3) ? 4 : 2,
2022                                           decode_compare_func(dword));
2023                                 dword = data[i];
2024                                 instr_out(data, hw_offset, i++,
2025                                           "sampler %d SS3: min_lod=%.2f,%s "
2026                                           "tcmode_x=%s, tcmode_y=%s, tcmode_z=%s,%s texmap_idx=%i,%s\n",
2027                                           sampler,
2028                                           ((dword >> 24) & 0xff) / (0x10 * 1.0),
2029                                           dword & (1 << 17) ?
2030                                           " kill pixel enable," : "",
2031                                           decode_tex_coord_mode(dword >> 12),
2032                                           decode_tex_coord_mode(dword >> 9),
2033                                           decode_tex_coord_mode(dword >> 6),
2034                                           dword & (1 << 5) ?
2035                                           " normalized coords," : "",
2036                                           (dword >> 1) & 0xf,
2037                                           dword & (1 << 0) ? " deinterlacer," :
2038                                           "");
2039                                 dword = data[i];
2040                                 instr_out(data, hw_offset, i++,
2041                                           "sampler %d SS4: border color\n",
2042                                           sampler);
2043                         }
2044                 }
2045                 if (len != i) {
2046                         fprintf(out, "Bad count in 3DSTATE_SAMPLER_STATE\n");
2047                 }
2048                 return len;
2049         case 0x85:
2050                 len = (data[0] & 0x0000000f) + 2;
2051
2052                 if (len != 2)
2053                         fprintf(out,
2054                                 "Bad count in 3DSTATE_DEST_BUFFER_VARIABLES\n");
2055                 if (count < 2)
2056                         BUFFER_FAIL(count, len,
2057                                     "3DSTATE_DEST_BUFFER_VARIABLES");
2058
2059                 instr_out(data, hw_offset, 0,
2060                           "3DSTATE_DEST_BUFFER_VARIABLES\n");
2061
2062                 switch ((data[1] >> 8) & 0xf) {
2063                 case 0x0:
2064                         format = "g8";
2065                         break;
2066                 case 0x1:
2067                         format = "x1r5g5b5";
2068                         break;
2069                 case 0x2:
2070                         format = "r5g6b5";
2071                         break;
2072                 case 0x3:
2073                         format = "a8r8g8b8";
2074                         break;
2075                 case 0x4:
2076                         format = "ycrcb_swapy";
2077                         break;
2078                 case 0x5:
2079                         format = "ycrcb_normal";
2080                         break;
2081                 case 0x6:
2082                         format = "ycrcb_swapuv";
2083                         break;
2084                 case 0x7:
2085                         format = "ycrcb_swapuvy";
2086                         break;
2087                 case 0x8:
2088                         format = "a4r4g4b4";
2089                         break;
2090                 case 0x9:
2091                         format = "a1r5g5b5";
2092                         break;
2093                 case 0xa:
2094                         format = "a2r10g10b10";
2095                         break;
2096                 default:
2097                         format = "BAD";
2098                         break;
2099                 }
2100                 switch ((data[1] >> 2) & 0x3) {
2101                 case 0x0:
2102                         zformat = "u16";
2103                         break;
2104                 case 0x1:
2105                         zformat = "f16";
2106                         break;
2107                 case 0x2:
2108                         zformat = "u24x8";
2109                         break;
2110                 default:
2111                         zformat = "BAD";
2112                         break;
2113                 }
2114                 instr_out(data, hw_offset, 1,
2115                           "%s format, %s depth format, early Z %sabled\n",
2116                           format, zformat,
2117                           (data[1] & (1 << 31)) ? "en" : "dis");
2118                 return len;
2119
2120         case 0x8e:
2121                 {
2122                         const char *name, *tiling;
2123
2124                         len = (data[0] & 0x0000000f) + 2;
2125                         if (len != 3)
2126                                 fprintf(out,
2127                                         "Bad count in 3DSTATE_BUFFER_INFO\n");
2128                         if (count < 3)
2129                                 BUFFER_FAIL(count, len, "3DSTATE_BUFFER_INFO");
2130
2131                         switch ((data[1] >> 24) & 0x7) {
2132                         case 0x3:
2133                                 name = "color";
2134                                 break;
2135                         case 0x7:
2136                                 name = "depth";
2137                                 break;
2138                         default:
2139                                 name = "unknown";
2140                                 break;
2141                         }
2142
2143                         tiling = "none";
2144                         if (data[1] & (1 << 23))
2145                                 tiling = "fenced";
2146                         else if (data[1] & (1 << 22))
2147                                 tiling = data[1] & (1 << 21) ? "Y" : "X";
2148
2149                         instr_out(data, hw_offset, 0, "3DSTATE_BUFFER_INFO\n");
2150                         instr_out(data, hw_offset, 1,
2151                                   "%s, tiling = %s, pitch=%d\n", name, tiling,
2152                                   data[1] & 0xffff);
2153
2154                         instr_out(data, hw_offset, 2, "address\n");
2155                         return len;
2156                 }
2157         case 0x81:
2158                 len = (data[0] & 0x0000000f) + 2;
2159
2160                 if (len != 3)
2161                         fprintf(out,
2162                                 "Bad count in 3DSTATE_SCISSOR_RECTANGLE\n");
2163                 if (count < 3)
2164                         BUFFER_FAIL(count, len, "3DSTATE_SCISSOR_RECTANGLE");
2165
2166                 instr_out(data, hw_offset, 0, "3DSTATE_SCISSOR_RECTANGLE\n");
2167                 instr_out(data, hw_offset, 1, "(%d,%d)\n",
2168                           data[1] & 0xffff, data[1] >> 16);
2169                 instr_out(data, hw_offset, 2, "(%d,%d)\n",
2170                           data[2] & 0xffff, data[2] >> 16);
2171
2172                 return len;
2173         case 0x80:
2174                 len = (data[0] & 0x0000000f) + 2;
2175
2176                 if (len != 5)
2177                         fprintf(out,
2178                                 "Bad count in 3DSTATE_DRAWING_RECTANGLE\n");
2179                 if (count < 5)
2180                         BUFFER_FAIL(count, len, "3DSTATE_DRAWING_RECTANGLE");
2181
2182                 instr_out(data, hw_offset, 0, "3DSTATE_DRAWING_RECTANGLE\n");
2183                 instr_out(data, hw_offset, 1, "%s\n",
2184                           data[1] & (1 << 30) ? "depth ofs disabled " : "");
2185                 instr_out(data, hw_offset, 2, "(%d,%d)\n",
2186                           data[2] & 0xffff, data[2] >> 16);
2187                 instr_out(data, hw_offset, 3, "(%d,%d)\n",
2188                           data[3] & 0xffff, data[3] >> 16);
2189                 instr_out(data, hw_offset, 4, "(%d,%d)\n",
2190                           data[4] & 0xffff, data[4] >> 16);
2191
2192                 return len;
2193         case 0x9c:
2194                 len = (data[0] & 0x0000000f) + 2;
2195
2196                 if (len != 7)
2197                         fprintf(out, "Bad count in 3DSTATE_CLEAR_PARAMETERS\n");
2198                 if (count < 7)
2199                         BUFFER_FAIL(count, len, "3DSTATE_CLEAR_PARAMETERS");
2200
2201                 instr_out(data, hw_offset, 0, "3DSTATE_CLEAR_PARAMETERS\n");
2202                 instr_out(data, hw_offset, 1, "prim_type=%s, clear=%s%s%s\n",
2203                           data[1] & (1 << 16) ? "CLEAR_RECT" : "ZONE_INIT",
2204                           data[1] & (1 << 2) ? "color," : "",
2205                           data[1] & (1 << 1) ? "depth," : "",
2206                           data[1] & (1 << 0) ? "stencil," : "");
2207                 instr_out(data, hw_offset, 2, "clear color\n");
2208                 instr_out(data, hw_offset, 3, "clear depth/stencil\n");
2209                 instr_out(data, hw_offset, 4, "color value (rgba8888)\n");
2210                 instr_out(data, hw_offset, 5, "depth value %f\n",
2211                           int_as_float(data[5]));
2212                 instr_out(data, hw_offset, 6, "clear stencil\n");
2213                 return len;
2214         }
2215
2216         for (idx = 0; idx < ARRAY_SIZE(opcodes_3d_1d); idx++) {
2217                 opcode_3d_1d = &opcodes_3d_1d[idx];
2218                 if (opcode_3d_1d->i830_only && !IS_GEN2(devid))
2219                         continue;
2220
2221                 if (((data[0] & 0x00ff0000) >> 16) == opcode_3d_1d->opcode) {
2222                         len = 1;
2223
2224                         instr_out(data, hw_offset, 0, "%s\n",
2225                                   opcode_3d_1d->name);
2226                         if (opcode_3d_1d->max_len > 1) {
2227                                 len = (data[0] & 0x0000ffff) + 2;
2228                                 if (len < opcode_3d_1d->min_len ||
2229                                     len > opcode_3d_1d->max_len) {
2230                                         fprintf(out, "Bad count in %s\n",
2231                                                 opcode_3d_1d->name);
2232                                 }
2233                         }
2234
2235                         for (i = 1; i < len; i++) {
2236                                 if (i >= count)
2237                                         BUFFER_FAIL(count, len,
2238                                                     opcode_3d_1d->name);
2239                                 instr_out(data, hw_offset, i, "dword %d\n", i);
2240                         }
2241
2242                         return len;
2243                 }
2244         }
2245
2246         instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_1d opcode = 0x%x\n",
2247                   opcode);
2248         return 1;
2249 }
2250
2251 static int
2252 decode_3d_primitive(struct drm_intel_decode *ctx)
2253 {
2254         uint32_t *data = ctx->data;
2255         uint32_t hw_offset = ctx->hw_offset;
2256         uint32_t count = ctx->count;
2257         char immediate = (data[0] & (1 << 23)) == 0;
2258         unsigned int len, i, j, ret;
2259         const char *primtype;
2260         int original_s2 = saved_s2;
2261         int original_s4 = saved_s4;
2262
2263         switch ((data[0] >> 18) & 0xf) {
2264         case 0x0:
2265                 primtype = "TRILIST";
2266                 break;
2267         case 0x1:
2268                 primtype = "TRISTRIP";
2269                 break;
2270         case 0x2:
2271                 primtype = "TRISTRIP_REVERSE";
2272                 break;
2273         case 0x3:
2274                 primtype = "TRIFAN";
2275                 break;
2276         case 0x4:
2277                 primtype = "POLYGON";
2278                 break;
2279         case 0x5:
2280                 primtype = "LINELIST";
2281                 break;
2282         case 0x6:
2283                 primtype = "LINESTRIP";
2284                 break;
2285         case 0x7:
2286                 primtype = "RECTLIST";
2287                 break;
2288         case 0x8:
2289                 primtype = "POINTLIST";
2290                 break;
2291         case 0x9:
2292                 primtype = "DIB";
2293                 break;
2294         case 0xa:
2295                 primtype = "CLEAR_RECT";
2296                 saved_s4 = 3 << 6;
2297                 saved_s2 = ~0;
2298                 break;
2299         default:
2300                 primtype = "unknown";
2301                 break;
2302         }
2303
2304         /* XXX: 3DPRIM_DIB not supported */
2305         if (immediate) {
2306                 len = (data[0] & 0x0003ffff) + 2;
2307                 instr_out(data, hw_offset, 0, "3DPRIMITIVE inline %s\n",
2308                           primtype);
2309                 if (count < len)
2310                         BUFFER_FAIL(count, len, "3DPRIMITIVE inline");
2311                 if (!saved_s2_set || !saved_s4_set) {
2312                         fprintf(out, "unknown vertex format\n");
2313                         for (i = 1; i < len; i++) {
2314                                 instr_out(data, hw_offset, i,
2315                                           "           vertex data (%f float)\n",
2316                                           int_as_float(data[i]));
2317                         }
2318                 } else {
2319                         unsigned int vertex = 0;
2320                         for (i = 1; i < len;) {
2321                                 unsigned int tc;
2322
2323 #define VERTEX_OUT(fmt, ...) do {                                       \
2324     if (i < len)                                                        \
2325         instr_out(data, hw_offset, i, " V%d."fmt"\n", vertex, __VA_ARGS__); \
2326     else                                                                \
2327         fprintf(out, " missing data in V%d\n", vertex);                 \
2328     i++;                                                                \
2329 } while (0)
2330
2331                                 VERTEX_OUT("X = %f", int_as_float(data[i]));
2332                                 VERTEX_OUT("Y = %f", int_as_float(data[i]));
2333                                 switch (saved_s4 >> 6 & 0x7) {
2334                                 case 0x1:
2335                                         VERTEX_OUT("Z = %f",
2336                                                    int_as_float(data[i]));
2337                                         break;
2338                                 case 0x2:
2339                                         VERTEX_OUT("Z = %f",
2340                                                    int_as_float(data[i]));
2341                                         VERTEX_OUT("W = %f",
2342                                                    int_as_float(data[i]));
2343                                         break;
2344                                 case 0x3:
2345                                         break;
2346                                 case 0x4:
2347                                         VERTEX_OUT("W = %f",
2348                                                    int_as_float(data[i]));
2349                                         break;
2350                                 default:
2351                                         fprintf(out, "bad S4 position mask\n");
2352                                 }
2353
2354                                 if (saved_s4 & (1 << 10)) {
2355                                         VERTEX_OUT
2356                                             ("color = (A=0x%02x, R=0x%02x, G=0x%02x, "
2357                                              "B=0x%02x)", data[i] >> 24,
2358                                              (data[i] >> 16) & 0xff,
2359                                              (data[i] >> 8) & 0xff,
2360                                              data[i] & 0xff);
2361                                 }
2362                                 if (saved_s4 & (1 << 11)) {
2363                                         VERTEX_OUT
2364                                             ("spec = (A=0x%02x, R=0x%02x, G=0x%02x, "
2365                                              "B=0x%02x)", data[i] >> 24,
2366                                              (data[i] >> 16) & 0xff,
2367                                              (data[i] >> 8) & 0xff,
2368                                              data[i] & 0xff);
2369                                 }
2370                                 if (saved_s4 & (1 << 12))
2371                                         VERTEX_OUT("width = 0x%08x)", data[i]);
2372
2373                                 for (tc = 0; tc <= 7; tc++) {
2374                                         switch ((saved_s2 >> (tc * 4)) & 0xf) {
2375                                         case 0x0:
2376                                                 VERTEX_OUT("T%d.X = %f", tc,
2377                                                            int_as_float(data
2378                                                                         [i]));
2379                                                 VERTEX_OUT("T%d.Y = %f", tc,
2380                                                            int_as_float(data
2381                                                                         [i]));
2382                                                 break;
2383                                         case 0x1:
2384                                                 VERTEX_OUT("T%d.X = %f", tc,
2385                                                            int_as_float(data
2386                                                                         [i]));
2387                                                 VERTEX_OUT("T%d.Y = %f", tc,
2388                                                            int_as_float(data
2389                                                                         [i]));
2390                                                 VERTEX_OUT("T%d.Z = %f", tc,
2391                                                            int_as_float(data
2392                                                                         [i]));
2393                                                 break;
2394                                         case 0x2:
2395                                                 VERTEX_OUT("T%d.X = %f", tc,
2396                                                            int_as_float(data
2397                                                                         [i]));
2398                                                 VERTEX_OUT("T%d.Y = %f", tc,
2399                                                            int_as_float(data
2400                                                                         [i]));
2401                                                 VERTEX_OUT("T%d.Z = %f", tc,
2402                                                            int_as_float(data
2403                                                                         [i]));
2404                                                 VERTEX_OUT("T%d.W = %f", tc,
2405                                                            int_as_float(data
2406                                                                         [i]));
2407                                                 break;
2408                                         case 0x3:
2409                                                 VERTEX_OUT("T%d.X = %f", tc,
2410                                                            int_as_float(data
2411                                                                         [i]));
2412                                                 break;
2413                                         case 0x4:
2414                                                 VERTEX_OUT
2415                                                     ("T%d.XY = 0x%08x half-float",
2416                                                      tc, data[i]);
2417                                                 break;
2418                                         case 0x5:
2419                                                 VERTEX_OUT
2420                                                     ("T%d.XY = 0x%08x half-float",
2421                                                      tc, data[i]);
2422                                                 VERTEX_OUT
2423                                                     ("T%d.ZW = 0x%08x half-float",
2424                                                      tc, data[i]);
2425                                                 break;
2426                                         case 0xf:
2427                                                 break;
2428                                         default:
2429                                                 fprintf(out,
2430                                                         "bad S2.T%d format\n",
2431                                                         tc);
2432                                         }
2433                                 }
2434                                 vertex++;
2435                         }
2436                 }
2437
2438                 ret = len;
2439         } else {
2440                 /* indirect vertices */
2441                 len = data[0] & 0x0000ffff;     /* index count */
2442                 if (data[0] & (1 << 17)) {
2443                         /* random vertex access */
2444                         if (count < (len + 1) / 2 + 1) {
2445                                 BUFFER_FAIL(count, (len + 1) / 2 + 1,
2446                                             "3DPRIMITIVE random indirect");
2447                         }
2448                         instr_out(data, hw_offset, 0,
2449                                   "3DPRIMITIVE random indirect %s (%d)\n",
2450                                   primtype, len);
2451                         if (len == 0) {
2452                                 /* vertex indices continue until 0xffff is
2453                                  * found
2454                                  */
2455                                 for (i = 1; i < count; i++) {
2456                                         if ((data[i] & 0xffff) == 0xffff) {
2457                                                 instr_out(data, hw_offset, i,
2458                                                           "    indices: (terminator)\n");
2459                                                 ret = i;
2460                                                 goto out;
2461                                         } else if ((data[i] >> 16) == 0xffff) {
2462                                                 instr_out(data, hw_offset, i,
2463                                                           "    indices: 0x%04x, (terminator)\n",
2464                                                           data[i] & 0xffff);
2465                                                 ret = i;
2466                                                 goto out;
2467                                         } else {
2468                                                 instr_out(data, hw_offset, i,
2469                                                           "    indices: 0x%04x, 0x%04x\n",
2470                                                           data[i] & 0xffff,
2471                                                           data[i] >> 16);
2472                                         }
2473                                 }
2474                                 fprintf(out,
2475                                         "3DPRIMITIVE: no terminator found in index buffer\n");
2476                                 ret = count;
2477                                 goto out;
2478                         } else {
2479                                 /* fixed size vertex index buffer */
2480                                 for (j = 1, i = 0; i < len; i += 2, j++) {
2481                                         if (i * 2 == len - 1) {
2482                                                 instr_out(data, hw_offset, j,
2483                                                           "    indices: 0x%04x\n",
2484                                                           data[j] & 0xffff);
2485                                         } else {
2486                                                 instr_out(data, hw_offset, j,
2487                                                           "    indices: 0x%04x, 0x%04x\n",
2488                                                           data[j] & 0xffff,
2489                                                           data[j] >> 16);
2490                                         }
2491                                 }
2492                         }
2493                         ret = (len + 1) / 2 + 1;
2494                         goto out;
2495                 } else {
2496                         /* sequential vertex access */
2497                         if (count < 2)
2498                                 BUFFER_FAIL(count, 2,
2499                                             "3DPRIMITIVE seq indirect");
2500                         instr_out(data, hw_offset, 0,
2501                                   "3DPRIMITIVE sequential indirect %s, %d starting from "
2502                                   "%d\n", primtype, len, data[1] & 0xffff);
2503                         instr_out(data, hw_offset, 1, "           start\n");
2504                         ret = 2;
2505                         goto out;
2506                 }
2507         }
2508
2509 out:
2510         saved_s2 = original_s2;
2511         saved_s4 = original_s4;
2512         return ret;
2513 }
2514
2515 static int
2516 decode_3d(struct drm_intel_decode *ctx)
2517 {
2518         uint32_t opcode;
2519         unsigned int idx;
2520         uint32_t *data = ctx->data;
2521         uint32_t hw_offset = ctx->hw_offset;
2522         uint32_t count = ctx->count;
2523
2524         struct {
2525                 uint32_t opcode;
2526                 unsigned int min_len;
2527                 unsigned int max_len;
2528                 const char *name;
2529         } opcodes_3d[] = {
2530                 { 0x06, 1, 1, "3DSTATE_ANTI_ALIASING" },
2531                 { 0x08, 1, 1, "3DSTATE_BACKFACE_STENCIL_OPS" },
2532                 { 0x09, 1, 1, "3DSTATE_BACKFACE_STENCIL_MASKS" },
2533                 { 0x16, 1, 1, "3DSTATE_COORD_SET_BINDINGS" },
2534                 { 0x15, 1, 1, "3DSTATE_FOG_COLOR" },
2535                 { 0x0b, 1, 1, "3DSTATE_INDEPENDENT_ALPHA_BLEND" },
2536                 { 0x0d, 1, 1, "3DSTATE_MODES_4" },
2537                 { 0x0c, 1, 1, "3DSTATE_MODES_5" },
2538                 { 0x07, 1, 1, "3DSTATE_RASTERIZATION_RULES"},
2539         }, *opcode_3d;
2540
2541         opcode = (data[0] & 0x1f000000) >> 24;
2542
2543         switch (opcode) {
2544         case 0x1f:
2545                 return decode_3d_primitive(ctx);
2546         case 0x1d:
2547                 return decode_3d_1d(ctx);
2548         case 0x1c:
2549                 return decode_3d_1c(ctx);
2550         }
2551
2552         for (idx = 0; idx < ARRAY_SIZE(opcodes_3d); idx++) {
2553                 opcode_3d = &opcodes_3d[idx];
2554                 if (opcode == opcode_3d->opcode) {
2555                         unsigned int len = 1, i;
2556
2557                         instr_out(data, hw_offset, 0, "%s\n", opcode_3d->name);
2558                         if (opcode_3d->max_len > 1) {
2559                                 len = (data[0] & 0xff) + 2;
2560                                 if (len < opcode_3d->min_len ||
2561                                     len > opcode_3d->max_len) {
2562                                         fprintf(out, "Bad count in %s\n",
2563                                                 opcode_3d->name);
2564                                 }
2565                         }
2566
2567                         for (i = 1; i < len; i++) {
2568                                 if (i >= count)
2569                                         BUFFER_FAIL(count, len,
2570                                                     opcode_3d->name);
2571                                 instr_out(data, hw_offset, i, "dword %d\n", i);
2572                         }
2573                         return len;
2574                 }
2575         }
2576
2577         instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d opcode = 0x%x\n", opcode);
2578         return 1;
2579 }
2580
2581 static const char *get_965_surfacetype(unsigned int surfacetype)
2582 {
2583         switch (surfacetype) {
2584         case 0:
2585                 return "1D";
2586         case 1:
2587                 return "2D";
2588         case 2:
2589                 return "3D";
2590         case 3:
2591                 return "CUBE";
2592         case 4:
2593                 return "BUFFER";
2594         case 7:
2595                 return "NULL";
2596         default:
2597                 return "unknown";
2598         }
2599 }
2600
2601 static const char *get_965_depthformat(unsigned int depthformat)
2602 {
2603         switch (depthformat) {
2604         case 0:
2605                 return "s8_z24float";
2606         case 1:
2607                 return "z32float";
2608         case 2:
2609                 return "z24s8";
2610         case 5:
2611                 return "z16";
2612         default:
2613                 return "unknown";
2614         }
2615 }
2616
2617 static const char *get_965_element_component(uint32_t data, int component)
2618 {
2619         uint32_t component_control = (data >> (16 + (3 - component) * 4)) & 0x7;
2620
2621         switch (component_control) {
2622         case 0:
2623                 return "nostore";
2624         case 1:
2625                 switch (component) {
2626                 case 0:
2627                         return "X";
2628                 case 1:
2629                         return "Y";
2630                 case 2:
2631                         return "Z";
2632                 case 3:
2633                         return "W";
2634                 default:
2635                         return "fail";
2636                 }
2637         case 2:
2638                 return "0.0";
2639         case 3:
2640                 return "1.0";
2641         case 4:
2642                 return "0x1";
2643         case 5:
2644                 return "VID";
2645         default:
2646                 return "fail";
2647         }
2648 }
2649
2650 static const char *get_965_prim_type(uint32_t data)
2651 {
2652         uint32_t primtype = (data >> 10) & 0x1f;
2653
2654         switch (primtype) {
2655         case 0x01:
2656                 return "point list";
2657         case 0x02:
2658                 return "line list";
2659         case 0x03:
2660                 return "line strip";
2661         case 0x04:
2662                 return "tri list";
2663         case 0x05:
2664                 return "tri strip";
2665         case 0x06:
2666                 return "tri fan";
2667         case 0x07:
2668                 return "quad list";
2669         case 0x08:
2670                 return "quad strip";
2671         case 0x09:
2672                 return "line list adj";
2673         case 0x0a:
2674                 return "line strip adj";
2675         case 0x0b:
2676                 return "tri list adj";
2677         case 0x0c:
2678                 return "tri strip adj";
2679         case 0x0d:
2680                 return "tri strip reverse";
2681         case 0x0e:
2682                 return "polygon";
2683         case 0x0f:
2684                 return "rect list";
2685         case 0x10:
2686                 return "line loop";
2687         case 0x11:
2688                 return "point list bf";
2689         case 0x12:
2690                 return "line strip cont";
2691         case 0x13:
2692                 return "line strip bf";
2693         case 0x14:
2694                 return "line strip cont bf";
2695         case 0x15:
2696                 return "tri fan no stipple";
2697         default:
2698                 return "fail";
2699         }
2700 }
2701
2702 static int
2703 i965_decode_urb_fence(uint32_t *data, uint32_t hw_offset, int len,
2704                       uint32_t count)
2705 {
2706         uint32_t vs_fence, clip_fence, gs_fence, sf_fence, vfe_fence, cs_fence;
2707
2708         if (len != 3)
2709                 fprintf(out, "Bad count in URB_FENCE\n");
2710         if (count < 3)
2711                 BUFFER_FAIL(count, len, "URB_FENCE");
2712
2713         vs_fence = data[1] & 0x3ff;
2714         gs_fence = (data[1] >> 10) & 0x3ff;
2715         clip_fence = (data[1] >> 20) & 0x3ff;
2716         sf_fence = data[2] & 0x3ff;
2717         vfe_fence = (data[2] >> 10) & 0x3ff;
2718         cs_fence = (data[2] >> 20) & 0x7ff;
2719
2720         instr_out(data, hw_offset, 0, "URB_FENCE: %s%s%s%s%s%s\n",
2721                   (data[0] >> 13) & 1 ? "cs " : "",
2722                   (data[0] >> 12) & 1 ? "vfe " : "",
2723                   (data[0] >> 11) & 1 ? "sf " : "",
2724                   (data[0] >> 10) & 1 ? "clip " : "",
2725                   (data[0] >> 9) & 1 ? "gs " : "",
2726                   (data[0] >> 8) & 1 ? "vs " : "");
2727         instr_out(data, hw_offset, 1,
2728                   "vs fence: %d, clip_fence: %d, gs_fence: %d\n",
2729                   vs_fence, clip_fence, gs_fence);
2730         instr_out(data, hw_offset, 2,
2731                   "sf fence: %d, vfe_fence: %d, cs_fence: %d\n",
2732                   sf_fence, vfe_fence, cs_fence);
2733         if (gs_fence < vs_fence)
2734                 fprintf(out, "gs fence < vs fence!\n");
2735         if (clip_fence < gs_fence)
2736                 fprintf(out, "clip fence < gs fence!\n");
2737         if (sf_fence < clip_fence)
2738                 fprintf(out, "sf fence < clip fence!\n");
2739         if (cs_fence < sf_fence)
2740                 fprintf(out, "cs fence < sf fence!\n");
2741
2742         return len;
2743 }
2744
2745 static void
2746 state_base_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
2747                const char *name)
2748 {
2749         if (data[index] & 1) {
2750                 instr_out(data, hw_offset, index,
2751                           "%s state base address 0x%08x\n", name,
2752                           data[index] & ~1);
2753         } else {
2754                 instr_out(data, hw_offset, index, "%s state base not updated\n",
2755                           name);
2756         }
2757 }
2758
2759 static void
2760 state_max_out(uint32_t *data, uint32_t hw_offset, unsigned int index,
2761               const char *name)
2762 {
2763         if (data[index] & 1) {
2764                 if (data[index] == 1) {
2765                         instr_out(data, hw_offset, index,
2766                                   "%s state upper bound disabled\n", name);
2767                 } else {
2768                         instr_out(data, hw_offset, index,
2769                                   "%s state upper bound 0x%08x\n", name,
2770                                   data[index] & ~1);
2771                 }
2772         } else {
2773                 instr_out(data, hw_offset, index,
2774                           "%s state upper bound not updated\n", name);
2775         }
2776 }
2777
2778 static int
2779 decode_3d_965(struct drm_intel_decode *ctx)
2780 {
2781         uint32_t opcode;
2782         unsigned int idx, len;
2783         unsigned int i, j, sba_len;
2784         const char *desc1 = NULL;
2785         uint32_t *data = ctx->data;
2786         uint32_t hw_offset = ctx->hw_offset;
2787         uint32_t count = ctx->count;
2788         uint32_t devid = ctx->devid;
2789
2790         struct {
2791                 uint32_t opcode;
2792                 int unsigned min_len;
2793                 int unsigned max_len;
2794                 const char *name;
2795         } opcodes_3d[] = {
2796                 { 0x6000, 3, 3, "URB_FENCE" },
2797                 { 0x6001, 2, 2, "CS_URB_STATE" },
2798                 { 0x6002, 2, 2, "CONSTANT_BUFFER" },
2799                 { 0x6101, 6, 6, "STATE_BASE_ADDRESS" },
2800                 { 0x6102, 2, 2, "STATE_SIP" },
2801                 { 0x6104, 1, 1, "3DSTATE_PIPELINE_SELECT" },
2802                 { 0x680b, 1, 1, "3DSTATE_VF_STATISTICS" },
2803                 { 0x6904, 1, 1, "3DSTATE_PIPELINE_SELECT" },
2804                 { 0x7800, 7, 7, "3DSTATE_PIPELINED_POINTERS" },
2805                 { 0x7801, 6, 6, "3DSTATE_BINDING_TABLE_POINTERS" },
2806                 { 0x7808, 5, 257, "3DSTATE_VERTEX_BUFFERS" },
2807                 { 0x7809, 3, 256, "3DSTATE_VERTEX_ELEMENTS" },
2808                 { 0x780a, 3, 3, "3DSTATE_INDEX_BUFFER" },
2809                 { 0x780b, 1, 1, "3DSTATE_VF_STATISTICS" },
2810                 { 0x7900, 4, 4, "3DSTATE_DRAWING_RECTANGLE" },
2811                 { 0x7901, 5, 5, "3DSTATE_CONSTANT_COLOR" },
2812                 { 0x7905, 5, 7, "3DSTATE_DEPTH_BUFFER" },
2813                 { 0x7906, 2, 2, "3DSTATE_POLY_STIPPLE_OFFSET" },
2814                 { 0x7907, 33, 33, "3DSTATE_POLY_STIPPLE_PATTERN" },
2815                 { 0x7908, 3, 3, "3DSTATE_LINE_STIPPLE" },
2816                 { 0x7909, 2, 2, "3DSTATE_GLOBAL_DEPTH_OFFSET_CLAMP" },
2817                 { 0x7909, 2, 2, "3DSTATE_CLEAR_PARAMS" },
2818                 { 0x790a, 3, 3, "3DSTATE_AA_LINE_PARAMETERS" },
2819                 { 0x790b, 4, 4, "3DSTATE_GS_SVB_INDEX" },
2820                 { 0x790d, 3, 3, "3DSTATE_MULTISAMPLE" },
2821                 { 0x7910, 2, 2, "3DSTATE_CLEAR_PARAMS" },
2822                 { 0x7b00, 6, 6, "3DPRIMITIVE" },
2823                 { 0x7802, 4, 4, "3DSTATE_SAMPLER_STATE_POINTERS" },
2824                 { 0x7805, 3, 3, "3DSTATE_URB" },
2825                 { 0x780d, 4, 4, "3DSTATE_VIEWPORT_STATE_POINTERS" },
2826                 { 0x780e, 4, 4, "3DSTATE_CC_STATE_POINTERS" },
2827                 { 0x780f, 2, 2, "3DSTATE_SCISSOR_STATE_POINTERS" },
2828                 { 0x7810, 6, 6, "3DSTATE_VS_STATE" },
2829                 { 0x7811, 7, 7, "3DSTATE_GS_STATE" },
2830                 { 0x7812, 4, 4, "3DSTATE_CLIP_STATE" },
2831                 { 0x7813, 20, 20, "3DSTATE_SF_STATE" },
2832                 { 0x7814, 9, 9, "3DSTATE_WM_STATE" },
2833                 { 0x7815, 5, 5, "3DSTATE_CONSTANT_VS_STATE" },
2834                 { 0x7816, 5, 5, "3DSTATE_CONSTANT_GS_STATE" },
2835                 { 0x7817, 5, 5, "3DSTATE_CONSTANT_PS_STATE" },
2836                 { 0x7818, 2, 2, "3DSTATE_SAMPLE_MASK"},
2837         }, *opcode_3d;
2838
2839         len = (data[0] & 0x0000ffff) + 2;
2840
2841         opcode = (data[0] & 0xffff0000) >> 16;
2842         switch (opcode) {
2843         case 0x6000:
2844                 len = (data[0] & 0x000000ff) + 2;
2845                 return i965_decode_urb_fence(data, hw_offset, len, count);
2846         case 0x6001:
2847                 instr_out(data, hw_offset, 0, "CS_URB_STATE\n");
2848                 instr_out(data, hw_offset, 1,
2849                           "entry_size: %d [%d bytes], n_entries: %d\n",
2850                           (data[1] >> 4) & 0x1f,
2851                           (((data[1] >> 4) & 0x1f) + 1) * 64, data[1] & 0x7);
2852                 return len;
2853         case 0x6002:
2854                 len = (data[0] & 0x000000ff) + 2;
2855                 instr_out(data, hw_offset, 0, "CONSTANT_BUFFER: %s\n",
2856                           (data[0] >> 8) & 1 ? "valid" : "invalid");
2857                 instr_out(data, hw_offset, 1,
2858                           "offset: 0x%08x, length: %d bytes\n", data[1] & ~0x3f,
2859                           ((data[1] & 0x3f) + 1) * 64);
2860                 return len;
2861         case 0x6101:
2862                 i = 0;
2863                 instr_out(data, hw_offset, 0, "STATE_BASE_ADDRESS\n");
2864                 i++;
2865
2866                 if (IS_GEN6(devid) || IS_GEN7(devid))
2867                         sba_len = 10;
2868                 else if (IS_GEN5(devid))
2869                         sba_len = 8;
2870                 else
2871                         sba_len = 6;
2872                 if (len != sba_len)
2873                         fprintf(out, "Bad count in STATE_BASE_ADDRESS\n");
2874                 if (len != sba_len)
2875                         BUFFER_FAIL(count, len, "STATE_BASE_ADDRESS");
2876
2877                 state_base_out(data, hw_offset, i++, "general");
2878                 state_base_out(data, hw_offset, i++, "surface");
2879                 if (IS_GEN6(devid) || IS_GEN7(devid))
2880                         state_base_out(data, hw_offset, i++, "dynamic");
2881                 state_base_out(data, hw_offset, i++, "indirect");
2882                 if (IS_GEN5(devid) || IS_GEN6(devid) || IS_GEN7(devid))
2883                         state_base_out(data, hw_offset, i++, "instruction");
2884
2885                 state_max_out(data, hw_offset, i++, "general");
2886                 if (IS_GEN6(devid) || IS_GEN7(devid))
2887                         state_max_out(data, hw_offset, i++, "dynamic");
2888                 state_max_out(data, hw_offset, i++, "indirect");
2889                 if (IS_GEN5(devid) || IS_GEN6(devid) || IS_GEN7(devid))
2890                         state_max_out(data, hw_offset, i++, "instruction");
2891
2892                 return len;
2893         case 0x7800:
2894                 if (len != 7)
2895                         fprintf(out,
2896                                 "Bad count in 3DSTATE_PIPELINED_POINTERS\n");
2897                 if (count < 7)
2898                         BUFFER_FAIL(count, len, "3DSTATE_PIPELINED_POINTERS");
2899
2900                 instr_out(data, hw_offset, 0, "3DSTATE_PIPELINED_POINTERS\n");
2901                 instr_out(data, hw_offset, 1, "VS state\n");
2902                 instr_out(data, hw_offset, 2, "GS state\n");
2903                 instr_out(data, hw_offset, 3, "Clip state\n");
2904                 instr_out(data, hw_offset, 4, "SF state\n");
2905                 instr_out(data, hw_offset, 5, "WM state\n");
2906                 instr_out(data, hw_offset, 6, "CC state\n");
2907                 return len;
2908         case 0x7801:
2909                 len = (data[0] & 0x000000ff) + 2;
2910                 if (len != 6 && len != 4)
2911                         fprintf(out,
2912                                 "Bad count in 3DSTATE_BINDING_TABLE_POINTERS\n");
2913                 if (len == 6) {
2914                         if (count < 6)
2915                                 BUFFER_FAIL(count, len,
2916                                             "3DSTATE_BINDING_TABLE_POINTERS");
2917                         instr_out(data, hw_offset, 0,
2918                                   "3DSTATE_BINDING_TABLE_POINTERS\n");
2919                         instr_out(data, hw_offset, 1, "VS binding table\n");
2920                         instr_out(data, hw_offset, 2, "GS binding table\n");
2921                         instr_out(data, hw_offset, 3, "Clip binding table\n");
2922                         instr_out(data, hw_offset, 4, "SF binding table\n");
2923                         instr_out(data, hw_offset, 5, "WM binding table\n");
2924                 } else {
2925                         if (count < 4)
2926                                 BUFFER_FAIL(count, len,
2927                                             "3DSTATE_BINDING_TABLE_POINTERS");
2928
2929                         instr_out(data, hw_offset, 0,
2930                                   "3DSTATE_BINDING_TABLE_POINTERS: VS mod %d, "
2931                                   "GS mod %d, PS mod %d\n",
2932                                   (data[0] & (1 << 8)) != 0,
2933                                   (data[0] & (1 << 9)) != 0,
2934                                   (data[0] & (1 << 12)) != 0);
2935                         instr_out(data, hw_offset, 1, "VS binding table\n");
2936                         instr_out(data, hw_offset, 2, "GS binding table\n");
2937                         instr_out(data, hw_offset, 3, "WM binding table\n");
2938                 }
2939
2940                 return len;
2941         case 0x7802:
2942                 len = (data[0] & 0xff) + 2;
2943                 if (len != 4)
2944                         fprintf(out,
2945                                 "Bad count in 3DSTATE_SAMPLER_STATE_POINTERS\n");
2946                 if (count < 4)
2947                         BUFFER_FAIL(count, len,
2948                                     "3DSTATE_SAMPLER_STATE_POINTERS");
2949                 instr_out(data, hw_offset, 0,
2950                           "3DSTATE_SAMPLER_STATE_POINTERS: VS mod %d, "
2951                           "GS mod %d, PS mod %d\n", (data[0] & (1 << 8)) != 0,
2952                           (data[0] & (1 << 9)) != 0,
2953                           (data[0] & (1 << 12)) != 0);
2954                 instr_out(data, hw_offset, 1, "VS sampler state\n");
2955                 instr_out(data, hw_offset, 2, "GS sampler state\n");
2956                 instr_out(data, hw_offset, 3, "WM sampler state\n");
2957                 return len;
2958         case 0x7805:
2959                 len = (data[0] & 0xff) + 2;
2960                 if (len != 3)
2961                         fprintf(out, "Bad count in 3DSTATE_URB\n");
2962                 if (count < 3)
2963                         BUFFER_FAIL(count, len, "3DSTATE_URB");
2964                 instr_out(data, hw_offset, 0, "3DSTATE_URB\n");
2965                 instr_out(data, hw_offset, 1,
2966                           "VS entries %d, alloc size %d (1024bit row)\n",
2967                           data[1] & 0xffff, ((data[1] >> 16) & 0x07f) + 1);
2968                 instr_out(data, hw_offset, 2,
2969                           "GS entries %d, alloc size %d (1024bit row)\n",
2970                           (data[2] >> 8) & 0x3ff, (data[2] & 7) + 1);
2971                 return len;
2972
2973         case 0x7808:
2974                 len = (data[0] & 0xff) + 2;
2975                 if ((len - 1) % 4 != 0)
2976                         fprintf(out, "Bad count in 3DSTATE_VERTEX_BUFFERS\n");
2977                 if (count < len)
2978                         BUFFER_FAIL(count, len, "3DSTATE_VERTEX_BUFFERS");
2979                 instr_out(data, hw_offset, 0, "3DSTATE_VERTEX_BUFFERS\n");
2980
2981                 for (i = 1; i < len;) {
2982                         int idx, access;
2983                         if (IS_GEN6(devid)) {
2984                                 idx = 26;
2985                                 access = 20;
2986                         } else {
2987                                 idx = 27;
2988                                 access = 26;
2989                         }
2990                         instr_out(data, hw_offset, i,
2991                                   "buffer %d: %s, pitch %db\n", data[i] >> idx,
2992                                   data[i] & (1 << access) ? "random" :
2993                                   "sequential", data[i] & 0x07ff);
2994                         i++;
2995                         instr_out(data, hw_offset, i++, "buffer address\n");
2996                         instr_out(data, hw_offset, i++, "max index\n");
2997                         instr_out(data, hw_offset, i++, "mbz\n");
2998                 }
2999                 return len;
3000
3001         case 0x7809:
3002                 len = (data[0] & 0xff) + 2;
3003                 if ((len + 1) % 2 != 0)
3004                         fprintf(out, "Bad count in 3DSTATE_VERTEX_ELEMENTS\n");
3005                 if (count < len)
3006                         BUFFER_FAIL(count, len, "3DSTATE_VERTEX_ELEMENTS");
3007                 instr_out(data, hw_offset, 0, "3DSTATE_VERTEX_ELEMENTS\n");
3008
3009                 for (i = 1; i < len;) {
3010                         instr_out(data, hw_offset, i,
3011                                   "buffer %d: %svalid, type 0x%04x, "
3012                                   "src offset 0x%04x bytes\n",
3013                                   data[i] >> (IS_GEN6(devid) ? 26 : 27),
3014                                   data[i] & (1 << (IS_GEN6(devid) ? 25 : 26)) ?
3015                                   "" : "in", (data[i] >> 16) & 0x1ff,
3016                                   data[i] & 0x07ff);
3017                         i++;
3018                         instr_out(data, hw_offset, i, "(%s, %s, %s, %s), "
3019                                   "dst offset 0x%02x bytes\n",
3020                                   get_965_element_component(data[i], 0),
3021                                   get_965_element_component(data[i], 1),
3022                                   get_965_element_component(data[i], 2),
3023                                   get_965_element_component(data[i], 3),
3024                                   (data[i] & 0xff) * 4);
3025                         i++;
3026                 }
3027                 return len;
3028
3029         case 0x780d:
3030                 len = (data[0] & 0xff) + 2;
3031                 if (len != 4)
3032                         fprintf(out,
3033                                 "Bad count in 3DSTATE_VIEWPORT_STATE_POINTERS\n");
3034                 if (count < len)
3035                         BUFFER_FAIL(count, len,
3036                                     "3DSTATE_VIEWPORT_STATE_POINTERS");
3037                 instr_out(data, hw_offset, 0,
3038                           "3DSTATE_VIEWPORT_STATE_POINTERS\n");
3039                 instr_out(data, hw_offset, 1, "clip\n");
3040                 instr_out(data, hw_offset, 2, "sf\n");
3041                 instr_out(data, hw_offset, 3, "cc\n");
3042                 return len;
3043
3044         case 0x780a:
3045                 len = (data[0] & 0xff) + 2;
3046                 if (len != 3)
3047                         fprintf(out, "Bad count in 3DSTATE_INDEX_BUFFER\n");
3048                 if (count < len)
3049                         BUFFER_FAIL(count, len, "3DSTATE_INDEX_BUFFER");
3050                 instr_out(data, hw_offset, 0, "3DSTATE_INDEX_BUFFER\n");
3051                 instr_out(data, hw_offset, 1, "beginning buffer address\n");
3052                 instr_out(data, hw_offset, 2, "ending buffer address\n");
3053                 return len;
3054
3055         case 0x780e:
3056                 len = (data[0] & 0xff) + 2;
3057                 if (len != 4)
3058                         fprintf(out,
3059                                 "Bad count in 3DSTATE_CC_STATE_POINTERS\n");
3060                 if (count < 4)
3061                         BUFFER_FAIL(count, len, "3DSTATE_CC_STATE_POINTERS");
3062                 instr_out(data, hw_offset, 0, "3DSTATE_CC_STATE_POINTERS\n");
3063                 instr_out(data, hw_offset, 1, "blend change %d\n", data[1] & 1);
3064                 instr_out(data, hw_offset, 2, "depth stencil change %d\n",
3065                           data[2] & 1);
3066                 instr_out(data, hw_offset, 3, "cc change %d\n", data[3] & 1);
3067                 return len;
3068
3069         case 0x780f:
3070                 len = (data[0] & 0xff) + 2;
3071                 if (len != 2)
3072                         fprintf(out, "Bad count in 3DSTATE_SCISSOR_POINTERS\n");
3073                 if (count < 2)
3074                         BUFFER_FAIL(count, len, "3DSTATE_SCISSOR_POINTERS");
3075                 instr_out(data, hw_offset, 0, "3DSTATE_SCISSOR_POINTERS\n");
3076                 instr_out(data, hw_offset, 1, "scissor rect offset\n");
3077                 return len;
3078
3079         case 0x7810:
3080                 len = (data[0] & 0xff) + 2;
3081                 if (len != 6)
3082                         fprintf(out, "Bad count in 3DSTATE_VS\n");
3083                 if (count < 6)
3084                         BUFFER_FAIL(count, len, "3DSTATE_VS");
3085                 instr_out(data, hw_offset, 0, "3DSTATE_VS\n");
3086                 instr_out(data, hw_offset, 1, "kernel pointer\n");
3087                 instr_out(data, hw_offset, 2,
3088                           "SPF=%d, VME=%d, Sampler Count %d, "
3089                           "Binding table count %d\n", (data[2] >> 31) & 1,
3090                           (data[2] >> 30) & 1, (data[2] >> 27) & 7,
3091                           (data[2] >> 18) & 0xff);
3092                 instr_out(data, hw_offset, 3, "scratch offset\n");
3093                 instr_out(data, hw_offset, 4,
3094                           "Dispatch GRF start %d, VUE read length %d, "
3095                           "VUE read offset %d\n", (data[4] >> 20) & 0x1f,
3096                           (data[4] >> 11) & 0x3f, (data[4] >> 4) & 0x3f);
3097                 instr_out(data, hw_offset, 5,
3098                           "Max Threads %d, Vertex Cache %sable, "
3099                           "VS func %sable\n", ((data[5] >> 25) & 0x7f) + 1,
3100                           (data[5] & (1 << 1)) != 0 ? "dis" : "en",
3101                           (data[5] & 1) != 0 ? "en" : "dis");
3102                 return len;
3103
3104         case 0x7811:
3105                 len = (data[0] & 0xff) + 2;
3106                 if (len != 7)
3107                         fprintf(out, "Bad count in 3DSTATE_GS\n");
3108                 if (count < 7)
3109                         BUFFER_FAIL(count, len, "3DSTATE_GS");
3110                 instr_out(data, hw_offset, 0, "3DSTATE_GS\n");
3111                 instr_out(data, hw_offset, 1, "kernel pointer\n");
3112                 instr_out(data, hw_offset, 2,
3113                           "SPF=%d, VME=%d, Sampler Count %d, "
3114                           "Binding table count %d\n", (data[2] >> 31) & 1,
3115                           (data[2] >> 30) & 1, (data[2] >> 27) & 7,
3116                           (data[2] >> 18) & 0xff);
3117                 instr_out(data, hw_offset, 3, "scratch offset\n");
3118                 instr_out(data, hw_offset, 4,
3119                           "Dispatch GRF start %d, VUE read length %d, "
3120                           "VUE read offset %d\n", (data[4] & 0xf),
3121                           (data[4] >> 11) & 0x3f, (data[4] >> 4) & 0x3f);
3122                 instr_out(data, hw_offset, 5,
3123                           "Max Threads %d, Rendering %sable\n",
3124                           ((data[5] >> 25) & 0x7f) + 1,
3125                           (data[5] & (1 << 8)) != 0 ? "en" : "dis");
3126                 instr_out(data, hw_offset, 6,
3127                           "Reorder %sable, Discard Adjaceny %sable, "
3128                           "GS %sable\n",
3129                           (data[6] & (1 << 30)) != 0 ? "en" : "dis",
3130                           (data[6] & (1 << 29)) != 0 ? "en" : "dis",
3131                           (data[6] & (1 << 15)) != 0 ? "en" : "dis");
3132                 return len;
3133
3134         case 0x7812:
3135                 len = (data[0] & 0xff) + 2;
3136                 if (len != 4)
3137                         fprintf(out, "Bad count in 3DSTATE_CLIP\n");
3138                 if (count < 4)
3139                         BUFFER_FAIL(count, len, "3DSTATE_CLIP");
3140                 instr_out(data, hw_offset, 0, "3DSTATE_CLIP\n");
3141                 instr_out(data, hw_offset, 1,
3142                           "UserClip distance cull test mask 0x%x\n",
3143                           data[1] & 0xff);
3144                 instr_out(data, hw_offset, 2,
3145                           "Clip %sable, API mode %s, Viewport XY test %sable, "
3146                           "Viewport Z test %sable, Guardband test %sable, Clip mode %d, "
3147                           "Perspective Divide %sable, Non-Perspective Barycentric %sable, "
3148                           "Tri Provoking %d, Line Provoking %d, Trifan Provoking %d\n",
3149                           (data[2] & (1 << 31)) != 0 ? "en" : "dis",
3150                           (data[2] & (1 << 30)) != 0 ? "D3D" : "OGL",
3151                           (data[2] & (1 << 28)) != 0 ? "en" : "dis",
3152                           (data[2] & (1 << 27)) != 0 ? "en" : "dis",
3153                           (data[2] & (1 << 26)) != 0 ? "en" : "dis",
3154                           (data[2] >> 13) & 7,
3155                           (data[2] & (1 << 9)) != 0 ? "dis" : "en",
3156                           (data[2] & (1 << 8)) != 0 ? "en" : "dis",
3157                           (data[2] >> 4) & 3, (data[2] >> 2) & 3,
3158                           (data[2] & 3));
3159                 instr_out(data, hw_offset, 3,
3160                           "Min PointWidth %d, Max PointWidth %d, "
3161                           "Force Zero RTAIndex %sable, Max VPIndex %d\n",
3162                           (data[3] >> 17) & 0x7ff, (data[3] >> 6) & 0x7ff,
3163                           (data[3] & (1 << 5)) != 0 ? "en" : "dis",
3164                           (data[3] & 0xf));
3165                 return len;
3166
3167         case 0x7813:
3168                 len = (data[0] & 0xff) + 2;
3169                 if (len != 20)
3170                         fprintf(out, "Bad count in 3DSTATE_SF\n");
3171                 if (count < 20)
3172                         BUFFER_FAIL(count, len, "3DSTATE_SF");
3173                 instr_out(data, hw_offset, 0, "3DSTATE_SF\n");
3174                 instr_out(data, hw_offset, 1,
3175                           "Attrib Out %d, Attrib Swizzle %sable, VUE read length %d, "
3176                           "VUE read offset %d\n", (data[1] >> 22) & 0x3f,
3177                           (data[1] & (1 << 21)) != 0 ? "en" : "dis",
3178                           (data[1] >> 11) & 0x1f, (data[1] >> 4) & 0x3f);
3179                 instr_out(data, hw_offset, 2,
3180                           "Legacy Global DepthBias %sable, FrontFace fill %d, BF fill %d, "
3181                           "VP transform %sable, FrontWinding_%s\n",
3182                           (data[2] & (1 << 11)) != 0 ? "en" : "dis",
3183                           (data[2] >> 5) & 3, (data[2] >> 3) & 3,
3184                           (data[2] & (1 << 1)) != 0 ? "en" : "dis",
3185                           (data[2] & 1) != 0 ? "CCW" : "CW");
3186                 instr_out(data, hw_offset, 3,
3187                           "AA %sable, CullMode %d, Scissor %sable, Multisample m ode %d\n",
3188                           (data[3] & (1 << 31)) != 0 ? "en" : "dis",
3189                           (data[3] >> 29) & 3,
3190                           (data[3] & (1 << 11)) != 0 ? "en" : "dis",
3191                           (data[3] >> 8) & 3);
3192                 instr_out(data, hw_offset, 4,
3193                           "Last Pixel %sable, SubPixel Precision %d, Use PixelWidth %d\n",
3194                           (data[4] & (1 << 31)) != 0 ? "en" : "dis",
3195                           (data[4] & (1 << 12)) != 0 ? 4 : 8,
3196                           (data[4] & (1 << 11)) != 0);
3197                 instr_out(data, hw_offset, 5,
3198                           "Global Depth Offset Constant %f\n",
3199                           *(float *)(&data[5]));
3200                 instr_out(data, hw_offset, 6, "Global Depth Offset Scale %f\n",
3201                           *(float *)(&data[6]));
3202                 instr_out(data, hw_offset, 7, "Global Depth Offset Clamp %f\n",
3203                           *(float *)(&data[7]));
3204
3205                 for (i = 0, j = 0; i < 8; i++, j += 2)
3206                         instr_out(data, hw_offset, i + 8,
3207                                   "Attrib %d (Override %s%s%s%s, Const Source %d, Swizzle Select %d, "
3208                                   "Source %d); Attrib %d (Override %s%s%s%s, Const Source %d, Swizzle Select %d, Source %d)\n",
3209                                   j + 1,
3210                                   (data[8 + i] & (1 << 31)) != 0 ? "W" : "",
3211                                   (data[8 + i] & (1 << 30)) != 0 ? "Z" : "",
3212                                   (data[8 + i] & (1 << 29)) != 0 ? "Y" : "",
3213                                   (data[8 + i] & (1 << 28)) != 0 ? "X" : "",
3214                                   (data[8 + i] >> 25) & 3,
3215                                   (data[8 + i] >> 22) & 3,
3216                                   (data[8 + i] >> 16) & 0x1f, j,
3217                                   (data[8 + i] & (1 << 15)) != 0 ? "W" : "",
3218                                   (data[8 + i] & (1 << 14)) != 0 ? "Z" : "",
3219                                   (data[8 + i] & (1 << 13)) != 0 ? "Y" : "",
3220                                   (data[8 + i] & (1 << 12)) != 0 ? "X" : "",
3221                                   (data[8 + i] >> 9) & 3,
3222                                   (data[8 + i] >> 6) & 3, (data[8 + i] & 0x1f));
3223                 instr_out(data, hw_offset, 16,
3224                           "Point Sprite TexCoord Enable\n");
3225                 instr_out(data, hw_offset, 17, "Const Interp Enable\n");
3226                 instr_out(data, hw_offset, 18,
3227                           "Attrib 7-0 WrapShortest Enable\n");
3228                 instr_out(data, hw_offset, 19,
3229                           "Attrib 15-8 WrapShortest Enable\n");
3230
3231                 return len;
3232
3233         case 0x7814:
3234                 len = (data[0] & 0xff) + 2;
3235                 if (len != 9)
3236                         fprintf(out, "Bad count in 3DSTATE_WM\n");
3237                 if (count < 9)
3238                         BUFFER_FAIL(count, len, "3DSTATE_WM");
3239                 instr_out(data, hw_offset, 0, "3DSTATE_WM\n");
3240                 instr_out(data, hw_offset, 1, "kernel start pointer 0\n");
3241                 instr_out(data, hw_offset, 2,
3242                           "SPF=%d, VME=%d, Sampler Count %d, "
3243                           "Binding table count %d\n", (data[2] >> 31) & 1,
3244                           (data[2] >> 30) & 1, (data[2] >> 27) & 7,
3245                           (data[2] >> 18) & 0xff);
3246                 instr_out(data, hw_offset, 3, "scratch offset\n");
3247                 instr_out(data, hw_offset, 4,
3248                           "Depth Clear %d, Depth Resolve %d, HiZ Resolve %d, "
3249                           "Dispatch GRF start[0] %d, start[1] %d, start[2] %d\n",
3250                           (data[4] & (1 << 30)) != 0,
3251                           (data[4] & (1 << 28)) != 0,
3252                           (data[4] & (1 << 27)) != 0, (data[4] >> 16) & 0x7f,
3253                           (data[4] >> 8) & 0x7f, (data[4] & 0x7f));
3254                 instr_out(data, hw_offset, 5,
3255                           "MaxThreads %d, PS KillPixel %d, PS computed Z %d, "
3256                           "PS use sourceZ %d, Thread Dispatch %d, PS use sourceW %d, Dispatch32 %d, "
3257                           "Dispatch16 %d, Dispatch8 %d\n",
3258                           ((data[5] >> 25) & 0x7f) + 1,
3259                           (data[5] & (1 << 22)) != 0,
3260                           (data[5] & (1 << 21)) != 0,
3261                           (data[5] & (1 << 20)) != 0,
3262                           (data[5] & (1 << 19)) != 0, (data[5] & (1 << 8)) != 0,
3263                           (data[5] & (1 << 2)) != 0, (data[5] & (1 << 1)) != 0,
3264                           (data[5] & (1 << 0)) != 0);
3265                 instr_out(data, hw_offset, 6,
3266                           "Num SF output %d, Pos XY offset %d, ZW interp mode %d , "
3267                           "Barycentric interp mode 0x%x, Point raster rule %d, Multisample mode %d, "
3268                           "Multisample Dispatch mode %d\n",
3269                           (data[6] >> 20) & 0x3f, (data[6] >> 18) & 3,
3270                           (data[6] >> 16) & 3, (data[6] >> 10) & 0x3f,
3271                           (data[6] & (1 << 9)) != 0, (data[6] >> 1) & 3,
3272                           (data[6] & 1));
3273                 instr_out(data, hw_offset, 7, "kernel start pointer 1\n");
3274                 instr_out(data, hw_offset, 8, "kernel start pointer 2\n");
3275
3276                 return len;
3277
3278         case 0x7900:
3279                 if (len != 4)
3280                         fprintf(out,
3281                                 "Bad count in 3DSTATE_DRAWING_RECTANGLE\n");
3282                 if (count < 4)
3283                         BUFFER_FAIL(count, len, "3DSTATE_DRAWING_RECTANGLE");
3284
3285                 instr_out(data, hw_offset, 0, "3DSTATE_DRAWING_RECTANGLE\n");
3286                 instr_out(data, hw_offset, 1, "top left: %d,%d\n",
3287                           data[1] & 0xffff, (data[1] >> 16) & 0xffff);
3288                 instr_out(data, hw_offset, 2, "bottom right: %d,%d\n",
3289                           data[2] & 0xffff, (data[2] >> 16) & 0xffff);
3290                 instr_out(data, hw_offset, 3, "origin: %d,%d\n",
3291                           (int)data[3] & 0xffff, ((int)data[3] >> 16) & 0xffff);
3292
3293                 return len;
3294
3295         case 0x7905:
3296                 if (len < 5 || len > 7)
3297                         fprintf(out, "Bad count in 3DSTATE_DEPTH_BUFFER\n");
3298                 if (count < len)
3299                         BUFFER_FAIL(count, len, "3DSTATE_DEPTH_BUFFER");
3300
3301                 instr_out(data, hw_offset, 0, "3DSTATE_DEPTH_BUFFER\n");
3302                 if (IS_GEN5(devid) || IS_GEN6(devid))
3303                         instr_out(data, hw_offset, 1,
3304                                   "%s, %s, pitch = %d bytes, %stiled, HiZ %d, Seperate Stencil %d\n",
3305                                   get_965_surfacetype(data[1] >> 29),
3306                                   get_965_depthformat((data[1] >> 18) & 0x7),
3307                                   (data[1] & 0x0001ffff) + 1,
3308                                   data[1] & (1 << 27) ? "" : "not ",
3309                                   (data[1] & (1 << 22)) != 0,
3310                                   (data[1] & (1 << 21)) != 0);
3311                 else
3312                         instr_out(data, hw_offset, 1,
3313                                   "%s, %s, pitch = %d bytes, %stiled\n",
3314                                   get_965_surfacetype(data[1] >> 29),
3315                                   get_965_depthformat((data[1] >> 18) & 0x7),
3316                                   (data[1] & 0x0001ffff) + 1,
3317                                   data[1] & (1 << 27) ? "" : "not ");
3318                 instr_out(data, hw_offset, 2, "depth offset\n");
3319                 instr_out(data, hw_offset, 3, "%dx%d\n",
3320                           ((data[3] & 0x0007ffc0) >> 6) + 1,
3321                           ((data[3] & 0xfff80000) >> 19) + 1);
3322                 instr_out(data, hw_offset, 4, "volume depth\n");
3323                 if (len >= 6)
3324                         instr_out(data, hw_offset, 5, "\n");
3325                 if (len >= 7) {
3326                         if (IS_GEN6(devid))
3327                                 instr_out(data, hw_offset, 6, "\n");
3328                         else
3329                                 instr_out(data, hw_offset, 6,
3330                                           "render target view extent\n");
3331                 }
3332
3333                 return len;
3334
3335         case 0x7a00:
3336                 if (IS_GEN6(devid) || IS_GEN7(devid)) {
3337                         unsigned int i;
3338                         len = (data[0] & 0xff) + 2;
3339                         if (len != 4 && len != 5)
3340                                 fprintf(out, "Bad count in PIPE_CONTROL\n");
3341                         if (count < len)
3342                                 BUFFER_FAIL(count, len, "PIPE_CONTROL");
3343
3344                         switch ((data[1] >> 14) & 0x3) {
3345                         case 0:
3346                                 desc1 = "no write";
3347                                 break;
3348                         case 1:
3349                                 desc1 = "qword write";
3350                                 break;
3351                         case 2:
3352                                 desc1 = "PS_DEPTH_COUNT write";
3353                                 break;
3354                         case 3:
3355                                 desc1 = "TIMESTAMP write";
3356                                 break;
3357                         }
3358                         instr_out(data, hw_offset, 0, "PIPE_CONTROL\n");
3359                         instr_out(data, hw_offset, 1,
3360                                   "%s, %s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s%s\n",
3361                                   desc1,
3362                                   data[1] & (1 << 20) ? "cs stall, " : "",
3363                                   data[1] & (1 << 19) ?
3364                                   "global snapshot count reset, " : "",
3365                                   data[1] & (1 << 18) ? "tlb invalidate, " : "",
3366                                   data[1] & (1 << 17) ? "gfdt flush, " : "",
3367                                   data[1] & (1 << 17) ? "media state clear, " :
3368                                   "",
3369                                   data[1] & (1 << 13) ? "depth stall, " : "",
3370                                   data[1] & (1 << 12) ?
3371                                   "render target cache flush, " : "",
3372                                   data[1] & (1 << 11) ?
3373                                   "instruction cache invalidate, " : "",
3374                                   data[1] & (1 << 10) ?
3375                                   "texture cache invalidate, " : "",
3376                                   data[1] & (1 << 9) ?
3377                                   "indirect state invalidate, " : "",
3378                                   data[1] & (1 << 8) ? "notify irq, " : "",
3379                                   data[1] & (1 << 7) ? "PIPE_CONTROL flush, " :
3380                                   "",
3381                                   data[1] & (1 << 6) ? "protect mem app_id, " :
3382                                   "", data[1] & (1 << 5) ? "DC flush, " : "",
3383                                   data[1] & (1 << 4) ? "vf fetch invalidate, " :
3384                                   "",
3385                                   data[1] & (1 << 3) ?
3386                                   "constant cache invalidate, " : "",
3387                                   data[1] & (1 << 2) ?
3388                                   "state cache invalidate, " : "",
3389                                   data[1] & (1 << 1) ? "stall at scoreboard, " :
3390                                   "",
3391                                   data[1] & (1 << 0) ? "depth cache flush, " :
3392                                   "");
3393                         if (len == 5) {
3394                                 instr_out(data, hw_offset, 2,
3395                                           "destination address\n");
3396                                 instr_out(data, hw_offset, 3,
3397                                           "immediate dword low\n");
3398                                 instr_out(data, hw_offset, 4,
3399                                           "immediate dword high\n");
3400                         } else {
3401                                 for (i = 2; i < len; i++) {
3402                                         instr_out(data, hw_offset, i, "\n");
3403                                 }
3404                         }
3405                         return len;
3406                 } else {
3407                         len = (data[0] & 0xff) + 2;
3408                         if (len != 4)
3409                                 fprintf(out, "Bad count in PIPE_CONTROL\n");
3410                         if (count < len)
3411                                 BUFFER_FAIL(count, len, "PIPE_CONTROL");
3412
3413                         switch ((data[0] >> 14) & 0x3) {
3414                         case 0:
3415                                 desc1 = "no write";
3416                                 break;
3417                         case 1:
3418                                 desc1 = "qword write";
3419                                 break;
3420                         case 2:
3421                                 desc1 = "PS_DEPTH_COUNT write";
3422                                 break;
3423                         case 3:
3424                                 desc1 = "TIMESTAMP write";
3425                                 break;
3426                         }
3427                         instr_out(data, hw_offset, 0,
3428                                   "PIPE_CONTROL: %s, %sdepth stall, %sRC write flush, "
3429                                   "%sinst flush\n",
3430                                   desc1,
3431                                   data[0] & (1 << 13) ? "" : "no ",
3432                                   data[0] & (1 << 12) ? "" : "no ",
3433                                   data[0] & (1 << 11) ? "" : "no ");
3434                         instr_out(data, hw_offset, 1, "destination address\n");
3435                         instr_out(data, hw_offset, 2, "immediate dword low\n");
3436                         instr_out(data, hw_offset, 3, "immediate dword high\n");
3437                         return len;
3438                 }
3439         case 0x7b00:
3440                 len = (data[0] & 0xff) + 2;
3441                 if (len != 6)
3442                         fprintf(out, "Bad count in 3DPRIMITIVE\n");
3443                 if (count < len)
3444                         BUFFER_FAIL(count, len, "3DPRIMITIVE");
3445
3446                 instr_out(data, hw_offset, 0,
3447                           "3DPRIMITIVE: %s %s\n",
3448                           get_965_prim_type(data[0]),
3449                           (data[0] & (1 << 15)) ? "random" : "sequential");
3450                 instr_out(data, hw_offset, 1, "vertex count\n");
3451                 instr_out(data, hw_offset, 2, "start vertex\n");
3452                 instr_out(data, hw_offset, 3, "instance count\n");
3453                 instr_out(data, hw_offset, 4, "start instance\n");
3454                 instr_out(data, hw_offset, 5, "index bias\n");
3455                 return len;
3456         }
3457
3458         for (idx = 0; idx < ARRAY_SIZE(opcodes_3d); idx++) {
3459                 opcode_3d = &opcodes_3d[idx];
3460                 if ((data[0] & 0xffff0000) >> 16 == opcode_3d->opcode) {
3461                         unsigned int i;
3462                         len = 1;
3463
3464                         instr_out(data, hw_offset, 0, "%s\n", opcode_3d->name);
3465                         if (opcode_3d->max_len > 1) {
3466                                 len = (data[0] & 0xff) + 2;
3467                                 if (len < opcode_3d->min_len ||
3468                                     len > opcode_3d->max_len) {
3469                                         fprintf(out, "Bad count in %s\n",
3470                                                 opcode_3d->name);
3471                                 }
3472                         }
3473
3474                         for (i = 1; i < len; i++) {
3475                                 if (i >= count)
3476                                         BUFFER_FAIL(count, len,
3477                                                     opcode_3d->name);
3478                                 instr_out(data, hw_offset, i, "dword %d\n", i);
3479                         }
3480                         return len;
3481                 }
3482         }
3483
3484         instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_965 opcode = 0x%x\n",
3485                   opcode);
3486         return 1;
3487 }
3488
3489 static int
3490 decode_3d_i830(struct drm_intel_decode *ctx)
3491 {
3492         unsigned int idx;
3493         uint32_t opcode;
3494         uint32_t *data = ctx->data;
3495         uint32_t hw_offset = ctx->hw_offset;
3496         uint32_t count = ctx->count;
3497
3498         struct {
3499                 uint32_t opcode;
3500                 unsigned int min_len;
3501                 unsigned int max_len;
3502                 const char *name;
3503         } opcodes_3d[] = {
3504                 { 0x02, 1, 1, "3DSTATE_MODES_3" },
3505                 { 0x03, 1, 1, "3DSTATE_ENABLES_1" },
3506                 { 0x04, 1, 1, "3DSTATE_ENABLES_2" },
3507                 { 0x05, 1, 1, "3DSTATE_VFT0" },
3508                 { 0x06, 1, 1, "3DSTATE_AA" },
3509                 { 0x07, 1, 1, "3DSTATE_RASTERIZATION_RULES" },
3510                 { 0x08, 1, 1, "3DSTATE_MODES_1" },
3511                 { 0x09, 1, 1, "3DSTATE_STENCIL_TEST" },
3512                 { 0x0a, 1, 1, "3DSTATE_VFT1" },
3513                 { 0x0b, 1, 1, "3DSTATE_INDPT_ALPHA_BLEND" },
3514                 { 0x0c, 1, 1, "3DSTATE_MODES_5" },
3515                 { 0x0d, 1, 1, "3DSTATE_MAP_BLEND_OP" },
3516                 { 0x0e, 1, 1, "3DSTATE_MAP_BLEND_ARG" },
3517                 { 0x0f, 1, 1, "3DSTATE_MODES_2" },
3518                 { 0x15, 1, 1, "3DSTATE_FOG_COLOR" },
3519                 { 0x16, 1, 1, "3DSTATE_MODES_4"},
3520         }, *opcode_3d;
3521
3522         opcode = (data[0] & 0x1f000000) >> 24;
3523
3524         switch (opcode) {
3525         case 0x1f:
3526                 return decode_3d_primitive(ctx);
3527         case 0x1d:
3528                 return decode_3d_1d(ctx);
3529         case 0x1c:
3530                 return decode_3d_1c(ctx);
3531         }
3532
3533         for (idx = 0; idx < ARRAY_SIZE(opcodes_3d); idx++) {
3534                 opcode_3d = &opcodes_3d[idx];
3535                 if ((data[0] & 0x1f000000) >> 24 == opcode_3d->opcode) {
3536                         unsigned int len = 1, i;
3537
3538                         instr_out(data, hw_offset, 0, "%s\n", opcode_3d->name);
3539                         if (opcode_3d->max_len > 1) {
3540                                 len = (data[0] & 0xff) + 2;
3541                                 if (len < opcode_3d->min_len ||
3542                                     len > opcode_3d->max_len) {
3543                                         fprintf(out, "Bad count in %s\n",
3544                                                 opcode_3d->name);
3545                                 }
3546                         }
3547
3548                         for (i = 1; i < len; i++) {
3549                                 if (i >= count)
3550                                         BUFFER_FAIL(count, len,
3551                                                     opcode_3d->name);
3552                                 instr_out(data, hw_offset, i, "dword %d\n", i);
3553                         }
3554                         return len;
3555                 }
3556         }
3557
3558         instr_out(data, hw_offset, 0, "3D UNKNOWN: 3d_i830 opcode = 0x%x\n",
3559                   opcode);
3560         return 1;
3561 }
3562
3563 struct drm_intel_decode *
3564 drm_intel_decode_context_alloc(uint32_t devid)
3565 {
3566         struct drm_intel_decode *ctx;
3567
3568         ctx = calloc(1, sizeof(struct drm_intel_decode));
3569         if (!ctx)
3570                 return NULL;
3571
3572         ctx->devid = devid;
3573         ctx->out = stdout;
3574
3575         return ctx;
3576 }
3577
3578 void
3579 drm_intel_decode_context_free(struct drm_intel_decode *ctx)
3580 {
3581         free(ctx);
3582 }
3583
3584 void
3585 drm_intel_decode_set_dump_past_end(struct drm_intel_decode *ctx,
3586                                    int dump_past_end)
3587 {
3588         ctx->dump_past_end = !!dump_past_end;
3589 }
3590
3591 void
3592 drm_intel_decode_set_batch_pointer(struct drm_intel_decode *ctx,
3593                                    void *data, uint32_t hw_offset, int count)
3594 {
3595         ctx->base_data = data;
3596         ctx->base_hw_offset = hw_offset;
3597         ctx->base_count = count;
3598 }
3599
3600 void
3601 drm_intel_decode_set_head_tail(struct drm_intel_decode *ctx,
3602                                uint32_t head, uint32_t tail)
3603 {
3604         ctx->head = head;
3605         ctx->tail = tail;
3606 }
3607
3608 void
3609 drm_intel_decode_set_output_file(struct drm_intel_decode *ctx,
3610                                  FILE *out)
3611 {
3612         ctx->out = out;
3613 }
3614
3615 /**
3616  * Decodes an i830-i915 batch buffer, writing the output to stdout.
3617  *
3618  * \param data batch buffer contents
3619  * \param count number of DWORDs to decode in the batch buffer
3620  * \param hw_offset hardware address for the buffer
3621  */
3622 void
3623 drm_intel_decode(struct drm_intel_decode *ctx)
3624 {
3625         int ret;
3626         unsigned int index = 0;
3627         uint32_t devid;
3628
3629         if (!ctx)
3630                 return;
3631
3632         ctx->data = ctx->base_data;
3633         ctx->hw_offset = ctx->base_hw_offset;
3634         ctx->count = ctx->base_count;
3635
3636         devid = ctx->devid;
3637         head_offset = ctx->head;
3638         tail_offset = ctx->tail;
3639         out = ctx->out;
3640
3641         saved_s2_set = 0;
3642         saved_s4_set = 1;
3643
3644         while (ctx->count > 0) {
3645                 index = 0;
3646
3647                 switch ((ctx->data[index] & 0xe0000000) >> 29) {
3648                 case 0x0:
3649                         ret = decode_mi(ctx);
3650
3651                         /* If MI_BATCHBUFFER_END happened, then dump
3652                          * the rest of the output in case we some day
3653                          * want it in debugging, but don't decode it
3654                          * since it'll just confuse in the common
3655                          * case.
3656                          */
3657                         if (ret == -1) {
3658                                 if (ctx->dump_past_end) {
3659                                         index++;
3660                                 } else {
3661                                         for (index = index + 1; index < ctx->count;
3662                                              index++) {
3663                                                 instr_out(ctx->data,
3664                                                           ctx->hw_offset,
3665                                                           index, "\n");
3666                                         }
3667                                 }
3668                         } else
3669                                 index += ret;
3670                         break;
3671                 case 0x2:
3672                         index += decode_2d(ctx);
3673                         break;
3674                 case 0x3:
3675                         if (IS_9XX(devid) && !IS_GEN3(devid)) {
3676                                 index +=
3677                                     decode_3d_965(ctx);
3678                         } else if (IS_GEN3(devid)) {
3679                                 index += decode_3d(ctx);
3680                         } else {
3681                                 index +=
3682                                     decode_3d_i830(ctx);
3683                         }
3684                         break;
3685                 default:
3686                         instr_out(ctx->data, ctx->hw_offset, index,
3687                                   "UNKNOWN\n");
3688                         index++;
3689                         break;
3690                 }
3691                 fflush(out);
3692
3693                 if (ctx->count < index)
3694                         break;
3695
3696                 ctx->count -= index;
3697                 ctx->data += index;
3698                 ctx->hw_offset += 4 * index;
3699         }
3700 }