1 /*
2 * Copyright © 2014 Broadcom
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24 #include "util/u_math.h"
25 #include "util/u_prim.h"
26 #include "util/macros.h"
27 #include "vc4_context.h"
28
/**
 * Prints one 32-bit payload word as a float followed by its raw hex value.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the word inside cl (first printed column)
 * @param hw_offset value printed in the second column, passed through as-is
 */
static void
dump_float(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint32_t raw = *(uint32_t *)(cl + offset);

        fprintf(stderr, "0x%08x 0x%08x: %f (0x%08x)\n",
                offset, hw_offset, uif(raw), raw);
}

/*
 * The line width and point size packets are dumped by dump_float; these
 * aliases let PACKET_DUMP() resolve dump_<packet name> for them.
 */
#define dump_VC4_PACKET_LINE_WIDTH dump_float
#define dump_VC4_PACKET_POINT_SIZE dump_float
40
/**
 * Prints the 32-bit address word that follows a BRANCH_TO_SUB_LIST header.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_BRANCH_TO_SUB_LIST(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint32_t target = *(uint32_t *)(cl + offset);

        fprintf(stderr, "0x%08x 0x%08x: addr 0x%08x\n",
                offset, hw_offset, target);
}
49
50 static void
dump_loadstore_full(void * cl,uint32_t offset,uint32_t hw_offset)51 dump_loadstore_full(void *cl, uint32_t offset, uint32_t hw_offset)
52 {
53 uint32_t bits = *(uint32_t *)(cl + offset);
54
55 fprintf(stderr, "0x%08x 0x%08x: addr 0x%08x%s%s%s%s\n",
56 offset, hw_offset,
57 bits & ~0xf,
58 (bits & VC4_LOADSTORE_FULL_RES_DISABLE_CLEAR_ALL) ? "" : " clear",
59 (bits & VC4_LOADSTORE_FULL_RES_DISABLE_ZS) ? "" : " zs",
60 (bits & VC4_LOADSTORE_FULL_RES_DISABLE_COLOR) ? "" : " color",
61 (bits & VC4_LOADSTORE_FULL_RES_EOF) ? " eof" : "");
62 }
63
/**
 * Dumps a LOAD_FULL_RES_TILE_BUFFER payload; the layout is handled entirely
 * by dump_loadstore_full().
 */
static void
dump_VC4_PACKET_LOAD_FULL_RES_TILE_BUFFER(void *cl, uint32_t offset,
                                          uint32_t hw_offset)
{
        dump_loadstore_full(cl, offset, hw_offset);
}
69
/**
 * Dumps a STORE_FULL_RES_TILE_BUFFER payload; the layout is handled entirely
 * by dump_loadstore_full().
 */
static void
dump_VC4_PACKET_STORE_FULL_RES_TILE_BUFFER(void *cl, uint32_t offset,
                                           uint32_t hw_offset)
{
        dump_loadstore_full(cl, offset, hw_offset);
}
75
/**
 * Shared dumper for the general tile buffer load/store packets.
 *
 * Three lines are printed:
 *  - byte 0: buffer selector (bits 0-2) and tiling mode (bits 4-6),
 *  - byte 1: pixel format (bits 0-1),
 *  - the 32-bit word at byte 2: address with the low four bits masked off,
 *    plus the flags carried in those low bits.
 *
 * Selector values without a known name are printed as "???".
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_loadstore_general(void *cl, uint32_t offset, uint32_t hw_offset)
{
        static const char *const buffer_names[] = {
                "none", "color", "zs", "z", "vgmask", "full",
        };
        static const char *const tiling_names[] = {
                "linear", "T", "LT",
        };
        static const char *const format_names[] = {
                "RGBA8888", "BGR565_DITHER", "BGR565",
        };

        const uint8_t *ctrl = cl + offset;
        const uint32_t addr_word = *(uint32_t *)(cl + offset + 2);

        const unsigned buffer_sel = ctrl[0] & 0x7;
        const unsigned tiling_sel = (ctrl[0] >> 4) & 7;
        const unsigned format_sel = ctrl[1] & 3;

        const char *buffer = buffer_sel < ARRAY_SIZE(buffer_names) ?
                buffer_names[buffer_sel] : "???";
        const char *tiling = tiling_sel < ARRAY_SIZE(tiling_names) ?
                tiling_names[tiling_sel] : "???";
        const char *format = format_sel < ARRAY_SIZE(format_names) ?
                format_names[format_sel] : "???";

        /* The three low address bits are only decoded for the "full" buffer. */
        const bool is_full = buffer_sel == 5;
        const char *fullcolor =
                (is_full && (addr_word & (1 << 0))) ? " !color" : "";
        const char *fullzs =
                (is_full && (addr_word & (1 << 1))) ? " !zs" : "";
        const char *fullvg =
                (is_full && (addr_word & (1 << 2))) ? " !vgmask" : "";
        const char *eof = (addr_word & (1 << 3)) ? " EOF" : "";

        fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s %s\n",
                offset + 0, hw_offset + 0, ctrl[0],
                buffer, tiling);

        fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s\n",
                offset + 1, hw_offset + 1, ctrl[1],
                format);

        fprintf(stderr, "0x%08x 0x%08x: addr 0x%08x %s%s%s%s\n",
                offset + 2, hw_offset + 2, addr_word & ~15,
                fullcolor, fullzs, fullvg, eof);
}
153
/**
 * Dumps a STORE_TILE_BUFFER_GENERAL payload; the layout is handled entirely
 * by dump_loadstore_general().
 */
static void
dump_VC4_PACKET_STORE_TILE_BUFFER_GENERAL(void *cl, uint32_t offset,
                                          uint32_t hw_offset)
{
        dump_loadstore_general(cl, offset, hw_offset);
}
159
/**
 * Dumps a LOAD_TILE_BUFFER_GENERAL payload; the layout is handled entirely
 * by dump_loadstore_general().
 */
static void
dump_VC4_PACKET_LOAD_TILE_BUFFER_GENERAL(void *cl, uint32_t offset,
                                         uint32_t hw_offset)
{
        dump_loadstore_general(cl, offset, hw_offset);
}
165
166 static void
dump_VC4_PACKET_GL_INDEXED_PRIMITIVE(void * cl,uint32_t offset,uint32_t hw_offset)167 dump_VC4_PACKET_GL_INDEXED_PRIMITIVE(void *cl, uint32_t offset, uint32_t hw_offset)
168 {
169 uint8_t *b = cl + offset;
170 uint32_t *count = cl + offset + 1;
171 uint32_t *ib_offset = cl + offset + 5;
172 uint32_t *max_index = cl + offset + 9;
173
174 fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s %s\n",
175 offset, hw_offset,
176 b[0], (b[0] & VC4_INDEX_BUFFER_U16) ? "16-bit" : "8-bit",
177 u_prim_name(b[0] & 0x7));
178 fprintf(stderr, "0x%08x 0x%08x: %d verts\n",
179 offset + 1, hw_offset + 1, *count);
180 fprintf(stderr, "0x%08x 0x%08x: 0x%08x IB offset\n",
181 offset + 5, hw_offset + 5, *ib_offset);
182 fprintf(stderr, "0x%08x 0x%08x: 0x%08x max index\n",
183 offset + 9, hw_offset + 9, *max_index);
184 }
185
/**
 * Dumps the payload of a GL_ARRAY_PRIMITIVE packet.
 *
 * Layout as read here: a mode byte whose bits 0-2 select the primitive type,
 * followed by two 32-bit words at byte offsets 1 and 5: vertex count and
 * start value.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_GL_ARRAY_PRIMITIVE(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint8_t mode = *(uint8_t *)(cl + offset);
        const uint32_t vert_count = *(uint32_t *)(cl + offset + 1);
        const uint32_t first = *(uint32_t *)(cl + offset + 5);

        fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s\n",
                offset, hw_offset, mode, u_prim_name(mode & 0x7));
        fprintf(stderr, "0x%08x 0x%08x: %d verts\n",
                offset + 1, hw_offset + 1, vert_count);
        fprintf(stderr, "0x%08x 0x%08x: 0x%08x start\n",
                offset + 5, hw_offset + 5, first);
}
200
/**
 * Prints the 32-bit flag word of a FLAT_SHADE_FLAGS packet in hex.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_FLAT_SHADE_FLAGS(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint32_t flags = *(uint32_t *)(cl + offset);

        fprintf(stderr, "0x%08x 0x%08x: bits 0x%08x\n",
                offset, hw_offset, flags);
}
209
/**
 * Dumps the payload of a VIEWPORT_OFFSET packet.
 *
 * The payload is read as two unsigned 16-bit values; each is printed divided
 * by 16.0 and again as raw hex.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_VIEWPORT_OFFSET(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint16_t *pair = cl + offset;
        const uint16_t x = pair[0];
        const uint16_t y = pair[1];

        fprintf(stderr, "0x%08x 0x%08x: %f, %f (0x%04x, 0x%04x)\n",
                offset, hw_offset,
                x / 16.0, y / 16.0,
                x, y);
}
220
/**
 * Dumps the payload of a CLIPPER_XY_SCALING packet.
 *
 * The payload is two 32-bit words.  Each is printed three ways: converted
 * with uif() and divided by 16.0, converted with uif() unscaled, and as raw
 * hex.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_CLIPPER_XY_SCALING(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint32_t *words = cl + offset;
        const uint32_t x_bits = words[0];
        const uint32_t y_bits = words[1];

        fprintf(stderr, "0x%08x 0x%08x: %f, %f (%f, %f, 0x%08x, 0x%08x)\n",
                offset, hw_offset,
                uif(x_bits) / 16.0, uif(y_bits) / 16.0,
                uif(x_bits), uif(y_bits),
                x_bits, y_bits);
}
232
/**
 * Dumps the payload of a CLIPPER_Z_SCALING packet.
 *
 * The two consecutive 32-bit words at cl + offset are printed as floats
 * (via uif()) and as raw hex.
 *
 * An earlier version additionally printed a second pair of words starting at
 * offset + 8.  The packet payload holds only two floats (Z scale and Z
 * offset), so that second pair lay outside the packet: it showed bytes of
 * whatever follows and could read past the end of the command list when this
 * packet is the last one.
 *
 * NOTE(review): VC4_PACKET_CLIPPER_Z_SCALING_SIZE is defined outside this
 * file; this assumes it is 9 (header byte + two floats), as described in the
 * VideoCore IV reference guide -- confirm.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_CLIPPER_Z_SCALING(void *cl, uint32_t offset, uint32_t hw_offset)
{
        uint32_t *z = cl + offset;

        fprintf(stderr, "0x%08x 0x%08x: %f, %f (0x%08x, 0x%08x)\n",
                offset, hw_offset,
                uif(z[0]), uif(z[1]),
                z[0], z[1]);
}
249
/**
 * Dumps the payload of a TILE_BINNING_MODE_CONFIG packet.
 *
 * Layout as read here: three 32-bit words at byte offsets 0, 4 and 8 (tile
 * alloc address, tile alloc size, tile state address) followed by three
 * single bytes at offsets 12, 13 and 14 (the two tile counts and a flags
 * byte).
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_TILE_BINNING_MODE_CONFIG(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint32_t alloc_addr = *(uint32_t *)(cl + offset);
        const uint32_t alloc_size = *(uint32_t *)(cl + offset + 4);
        const uint32_t state_addr = *(uint32_t *)(cl + offset + 8);
        const uint8_t *tail = cl + offset + 12;
        const uint8_t tiles_x = tail[0];
        const uint8_t tiles_y = tail[1];
        const uint8_t flags = tail[2];

        fprintf(stderr, "0x%08x 0x%08x: tile alloc addr 0x%08x\n",
                offset, hw_offset, alloc_addr);

        fprintf(stderr, "0x%08x 0x%08x: tile alloc size %db\n",
                offset + 4, hw_offset + 4, alloc_size);

        fprintf(stderr, "0x%08x 0x%08x: tile state addr 0x%08x\n",
                offset + 8, hw_offset + 8, state_addr);

        fprintf(stderr, "0x%08x 0x%08x: tiles (%d, %d)\n",
                offset + 12, hw_offset + 12, tiles_x, tiles_y);

        fprintf(stderr, "0x%08x 0x%08x: flags 0x%02x\n",
                offset + 14, hw_offset + 14, flags);
}
280
281 static void
dump_VC4_PACKET_TILE_RENDERING_MODE_CONFIG(void * cl,uint32_t offset,uint32_t hw_offset)282 dump_VC4_PACKET_TILE_RENDERING_MODE_CONFIG(void *cl, uint32_t offset, uint32_t hw_offset)
283 {
284 uint32_t *render_offset = cl + offset;
285 uint16_t *shorts = cl + offset + 4;
286 uint8_t *bytes = cl + offset + 8;
287
288 fprintf(stderr, "0x%08x 0x%08x: color offset 0x%08x\n",
289 offset, hw_offset,
290 *render_offset);
291
292 fprintf(stderr, "0x%08x 0x%08x: width %d\n",
293 offset + 4, hw_offset + 4,
294 shorts[0]);
295
296 fprintf(stderr, "0x%08x 0x%08x: height %d\n",
297 offset + 6, hw_offset + 6,
298 shorts[1]);
299
300 const char *format = "???";
301 switch (VC4_GET_FIELD(shorts[2], VC4_RENDER_CONFIG_FORMAT)) {
302 case VC4_RENDER_CONFIG_FORMAT_BGR565_DITHERED:
303 format = "BGR565_DITHERED";
304 break;
305 case VC4_RENDER_CONFIG_FORMAT_RGBA8888:
306 format = "RGBA8888";
307 break;
308 case VC4_RENDER_CONFIG_FORMAT_BGR565:
309 format = "BGR565";
310 break;
311 }
312 if (shorts[2] & VC4_RENDER_CONFIG_TILE_BUFFER_64BIT)
313 format = "64bit";
314
315 const char *tiling = "???";
316 switch (VC4_GET_FIELD(shorts[2], VC4_RENDER_CONFIG_MEMORY_FORMAT)) {
317 case VC4_TILING_FORMAT_LINEAR:
318 tiling = "linear";
319 break;
320 case VC4_TILING_FORMAT_T:
321 tiling = "T";
322 break;
323 case VC4_TILING_FORMAT_LT:
324 tiling = "LT";
325 break;
326 }
327
328 fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s %s %s %s\n",
329 offset + 8, hw_offset + 8,
330 bytes[0],
331 format, tiling,
332 (shorts[2] & VC4_RENDER_CONFIG_MS_MODE_4X) ? "ms" : "ss",
333 (shorts[2] & VC4_RENDER_CONFIG_DECIMATE_MODE_4X) ?
334 "ms_decimate" : "ss_decimate");
335
336 const char *earlyz = "";
337 if (shorts[2] & VC4_RENDER_CONFIG_EARLY_Z_COVERAGE_DISABLE) {
338 earlyz = "early_z disabled";
339 } else {
340 if (shorts[2] & VC4_RENDER_CONFIG_EARLY_Z_DIRECTION_G)
341 earlyz = "early_z >";
342 else
343 earlyz = "early_z <";
344 }
345
346 fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s\n",
347 offset + 9, hw_offset + 9,
348 bytes[1],
349 earlyz);
350 }
351
/**
 * Prints the two payload bytes of a TILE_COORDINATES packet in decimal.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_TILE_COORDINATES(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint8_t *xy = cl + offset;
        const uint8_t first = xy[0];
        const uint8_t second = xy[1];

        fprintf(stderr, "0x%08x 0x%08x: %d, %d\n",
                offset, hw_offset, first, second);
}
360
/**
 * Prints the two 32-bit handle values carried by a GEM_HANDLES packet.
 *
 * @param cl        base of the command list buffer
 * @param offset    byte offset of the payload inside cl
 * @param hw_offset value printed in the second column
 */
static void
dump_VC4_PACKET_GEM_HANDLES(void *cl, uint32_t offset, uint32_t hw_offset)
{
        const uint32_t *pair = cl + offset;
        const uint32_t handle0 = pair[0];
        const uint32_t handle1 = pair[1];

        fprintf(stderr, "0x%08x 0x%08x: handle 0: %d, handle 1: %d\n",
                offset, hw_offset, handle0, handle1);
}
369
370 #define PACKET_DUMP(name) [name] = { #name, name ## _SIZE, dump_##name }
371 #define PACKET(name) [name] = { #name, name ## _SIZE, NULL }
372
373 static const struct packet_info {
374 const char *name;
375 uint8_t size;
376 void (*dump_func)(void *cl, uint32_t offset, uint32_t hw_offset);
377 } packet_info[] = {
378 PACKET(VC4_PACKET_HALT),
379 PACKET(VC4_PACKET_NOP),
380
381 PACKET(VC4_PACKET_FLUSH),
382 PACKET(VC4_PACKET_FLUSH_ALL),
383 PACKET(VC4_PACKET_START_TILE_BINNING),
384 PACKET(VC4_PACKET_INCREMENT_SEMAPHORE),
385 PACKET(VC4_PACKET_WAIT_ON_SEMAPHORE),
386
387 PACKET(VC4_PACKET_BRANCH),
388 PACKET_DUMP(VC4_PACKET_BRANCH_TO_SUB_LIST),
389
390 PACKET(VC4_PACKET_STORE_MS_TILE_BUFFER),
391 PACKET(VC4_PACKET_STORE_MS_TILE_BUFFER_AND_EOF),
392 PACKET_DUMP(VC4_PACKET_STORE_FULL_RES_TILE_BUFFER),
393 PACKET_DUMP(VC4_PACKET_LOAD_FULL_RES_TILE_BUFFER),
394 PACKET_DUMP(VC4_PACKET_STORE_TILE_BUFFER_GENERAL),
395 PACKET_DUMP(VC4_PACKET_LOAD_TILE_BUFFER_GENERAL),
396
397 PACKET_DUMP(VC4_PACKET_GL_INDEXED_PRIMITIVE),
398 PACKET_DUMP(VC4_PACKET_GL_ARRAY_PRIMITIVE),
399
400 PACKET(VC4_PACKET_COMPRESSED_PRIMITIVE),
401 PACKET(VC4_PACKET_CLIPPED_COMPRESSED_PRIMITIVE),
402
403 PACKET(VC4_PACKET_PRIMITIVE_LIST_FORMAT),
404
405 PACKET(VC4_PACKET_GL_SHADER_STATE),
406 PACKET(VC4_PACKET_NV_SHADER_STATE),
407 PACKET(VC4_PACKET_VG_SHADER_STATE),
408
409 PACKET(VC4_PACKET_CONFIGURATION_BITS),
410 PACKET_DUMP(VC4_PACKET_FLAT_SHADE_FLAGS),
411 PACKET_DUMP(VC4_PACKET_POINT_SIZE),
412 PACKET_DUMP(VC4_PACKET_LINE_WIDTH),
413 PACKET(VC4_PACKET_RHT_X_BOUNDARY),
414 PACKET(VC4_PACKET_DEPTH_OFFSET),
415 PACKET(VC4_PACKET_CLIP_WINDOW),
416 PACKET_DUMP(VC4_PACKET_VIEWPORT_OFFSET),
417 PACKET(VC4_PACKET_Z_CLIPPING),
418 PACKET_DUMP(VC4_PACKET_CLIPPER_XY_SCALING),
419 PACKET_DUMP(VC4_PACKET_CLIPPER_Z_SCALING),
420
421 PACKET_DUMP(VC4_PACKET_TILE_BINNING_MODE_CONFIG),
422 PACKET_DUMP(VC4_PACKET_TILE_RENDERING_MODE_CONFIG),
423 PACKET(VC4_PACKET_CLEAR_COLORS),
424 PACKET_DUMP(VC4_PACKET_TILE_COORDINATES),
425
426 PACKET_DUMP(VC4_PACKET_GEM_HANDLES),
427 };
428
429 void
vc4_dump_cl(void * cl,uint32_t size,bool is_render)430 vc4_dump_cl(void *cl, uint32_t size, bool is_render)
431 {
432 uint32_t offset = 0, hw_offset = 0;
433 uint8_t *cmds = cl;
434
435 while (offset < size) {
436 uint8_t header = cmds[offset];
437
438 if (header >= ARRAY_SIZE(packet_info) ||
439 !packet_info[header].name) {
440 fprintf(stderr, "0x%08x 0x%08x: Unknown packet 0x%02x (%d)!\n",
441 offset, hw_offset, header, header);
442 return;
443 }
444
445 const struct packet_info *p = packet_info + header;
446 fprintf(stderr, "0x%08x 0x%08x: 0x%02x %s\n",
447 offset,
448 header != VC4_PACKET_GEM_HANDLES ? hw_offset : 0,
449 header, p->name);
450
451 if (offset + p->size <= size &&
452 p->dump_func) {
453 p->dump_func(cmds, offset + 1, hw_offset + 1);
454 } else {
455 for (uint32_t i = 1; i < p->size; i++) {
456 if (offset + i >= size) {
457 fprintf(stderr, "0x%08x 0x%08x: CL overflow!\n",
458 offset + i, hw_offset + i);
459 return;
460 }
461 fprintf(stderr, "0x%08x 0x%08x: 0x%02x\n",
462 offset + i,
463 header != VC4_PACKET_GEM_HANDLES ? hw_offset + i : 0,
464 cmds[offset + i]);
465 }
466 }
467
468 switch (header) {
469 case VC4_PACKET_HALT:
470 case VC4_PACKET_STORE_MS_TILE_BUFFER_AND_EOF:
471 return;
472 default:
473 break;
474 }
475
476 offset += p->size;
477 if (header != VC4_PACKET_GEM_HANDLES)
478 hw_offset += p->size;
479 }
480 }
481
482