xref: /third_party/mesa3d/src/intel/tools/error2aub.c (revision bf215546)
1/*
2 * Copyright © 2018 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 *
23 */
24
25#include <assert.h>
26#include <getopt.h>
27#include <inttypes.h>
28#include <signal.h>
29#include <stdio.h>
30#include <stdlib.h>
31#include <string.h>
32#include <stdarg.h>
33#include <zlib.h>
34
35#include "util/list.h"
36
37#include "aub_write.h"
38#include "drm-uapi/i915_drm.h"
39#include "intel_aub.h"
40
/* Hand a condition plus a printf-style message to _fail_if(), which is
 * declared outside this file; no prefix string (NULL) is supplied.
 */
#define fail_if(cond, ...) _fail_if(cond, NULL, __VA_ARGS__)

/* Same as fail_if() with a condition that is always true. */
#define fail(...) _fail_if(true, NULL, __VA_ARGS__)
44
45static int zlib_inflate(uint32_t **ptr, int len)
46{
47   struct z_stream_s zstream;
48   void *out;
49   const uint32_t out_size = 128*4096;  /* approximate obj size */
50
51   memset(&zstream, 0, sizeof(zstream));
52
53   zstream.next_in = (unsigned char *)*ptr;
54   zstream.avail_in = 4*len;
55
56   if (inflateInit(&zstream) != Z_OK)
57      return 0;
58
59   out = malloc(out_size);
60   zstream.next_out = out;
61   zstream.avail_out = out_size;
62
63   do {
64      switch (inflate(&zstream, Z_SYNC_FLUSH)) {
65      case Z_STREAM_END:
66         goto end;
67      case Z_OK:
68         break;
69      default:
70         inflateEnd(&zstream);
71         return 0;
72      }
73
74      if (zstream.avail_out)
75         break;
76
77      out = realloc(out, 2*zstream.total_out);
78      if (out == NULL) {
79         inflateEnd(&zstream);
80         return 0;
81      }
82
83      zstream.next_out = (unsigned char *)out + zstream.total_out;
84      zstream.avail_out = zstream.total_out;
85   } while (1);
86 end:
87   inflateEnd(&zstream);
88   free(*ptr);
89   *ptr = out;
90   return zstream.total_out / 4;
91}
92
/**
 * Decode one run of ASCII85 text into an array of 32-bit words.
 *
 * A lone 'z' encodes an all-zero word; every other word is encoded as five
 * characters in the range '!'..'u'. Decoding stops at the first character
 * that cannot start a group, or at a group that is truncated or contains a
 * character outside '!'..'u' (so the NUL terminator is never read past).
 *
 * @param in       NUL-terminated encoded text.
 * @param out      Heap buffer (may point to NULL) that is resized to receive
 *                 the decoded words. If a resize fails the previous buffer is
 *                 left in place.
 * @param inflate  When true, the decoded words are additionally passed
 *                 through zlib_inflate().
 * @return         Number of dwords stored in *out, or 0 on failure.
 */
static int ascii85_decode(const char *in, uint32_t **out, bool inflate)
{
   int len = 0, size = 1024;
   uint32_t *buf;

   buf = realloc(*out, sizeof(uint32_t)*size);
   if (buf == NULL)
      return 0;
   *out = buf;

   while (*in >= '!' && *in <= 'z') {
      uint32_t v = 0;

      if (len == size) {
         size *= 2;
         buf = realloc(*out, sizeof(uint32_t)*size);
         if (buf == NULL)
            return 0;
         *out = buf;
      }

      if (*in == 'z') {
         in++;
      } else {
         int i;

         /* Validate each character before using it; the check also catches
          * the terminating NUL of a group that was cut short.
          */
         for (i = 0; i < 5; i++) {
            if (in[i] < '!' || in[i] > 'u')
               break;
            v = v * 85 + (uint32_t)(in[i] - '!');
         }
         if (i < 5)
            break;
         in += 5;
      }
      (*out)[len++] = v;
   }

   if (!inflate)
      return len;

   return zlib_inflate(out, len);
}
129
/**
 * Print the command line usage text.
 *
 * @param progname  Program name shown on the "Usage:" line.
 * @param file      Stream the text is written to.
 */
static void
print_help(const char *progname, FILE *file)
{
   fprintf(file,
           "Usage: %s [OPTION]... [FILE]\n"
           "Convert an Intel GPU i915 error state to an aub file.\n"
           "  -h, --help          display this help and exit\n"
           "  -o, --output=FILE   the output aub file (default FILE.aub)\n"
           "  -v, --verbose       print verbose output to stdout\n",
           progname);
}
140
141struct bo {
142   enum address_space {
143      PPGTT,
144      GGTT,
145   } gtt;
146   enum bo_type {
147      BO_TYPE_UNKNOWN = 0,
148      BO_TYPE_BATCH,
149      BO_TYPE_USER,
150      BO_TYPE_CONTEXT,
151      BO_TYPE_RINGBUFFER,
152      BO_TYPE_STATUS,
153      BO_TYPE_CONTEXT_WA,
154   } type;
155   const char *name;
156   uint64_t addr;
157   uint8_t *data;
158   uint64_t size;
159
160   enum drm_i915_gem_engine_class engine_class;
161   int engine_instance;
162
163   struct list_head link;
164};
165
166static struct bo *
167find_or_create(struct list_head *bo_list, uint64_t addr,
168               enum address_space gtt,
169               enum drm_i915_gem_engine_class engine_class,
170               int engine_instance)
171{
172   list_for_each_entry(struct bo, bo_entry, bo_list, link) {
173      if (bo_entry->addr == addr &&
174          bo_entry->gtt == gtt &&
175          bo_entry->engine_class == engine_class &&
176          bo_entry->engine_instance == engine_instance)
177         return bo_entry;
178   }
179
180   struct bo *new_bo = calloc(1, sizeof(*new_bo));
181   new_bo->addr = addr;
182   new_bo->gtt = gtt;
183   new_bo->engine_class = engine_class;
184   new_bo->engine_instance = engine_instance;
185   list_addtail(&new_bo->link, bo_list);
186
187   return new_bo;
188}
189
190static void
191engine_from_name(const char *engine_name,
192                 enum drm_i915_gem_engine_class *engine_class,
193                 int *engine_instance)
194{
195   const struct {
196      const char *match;
197      enum drm_i915_gem_engine_class engine_class;
198      bool parse_instance;
199   } rings[] = {
200      { "rcs", I915_ENGINE_CLASS_RENDER, true },
201      { "vcs", I915_ENGINE_CLASS_VIDEO, true },
202      { "vecs", I915_ENGINE_CLASS_VIDEO_ENHANCE, true },
203      { "bcs", I915_ENGINE_CLASS_COPY, true },
204      { "global", I915_ENGINE_CLASS_INVALID, false },
205      { "render command stream", I915_ENGINE_CLASS_RENDER, false },
206      { "blt command stream", I915_ENGINE_CLASS_COPY, false },
207      { "bsd command stream", I915_ENGINE_CLASS_VIDEO, false },
208      { "vebox command stream", I915_ENGINE_CLASS_VIDEO_ENHANCE, false },
209      { NULL, I915_ENGINE_CLASS_INVALID },
210   }, *r;
211
212   for (r = rings; r->match; r++) {
213      if (strncasecmp(engine_name, r->match, strlen(r->match)) == 0) {
214         *engine_class = r->engine_class;
215         if (r->parse_instance)
216            *engine_instance = strtol(engine_name + strlen(r->match), NULL, 10);
217         else
218            *engine_instance = 0;
219         return;
220      }
221   }
222
223   fail("Unknown engine %s\n", engine_name);
224}
225
226int
227main(int argc, char *argv[])
228{
229   int i, c;
230   bool help = false, verbose = false;
231   char *out_filename = NULL, *in_filename = NULL;
232   const struct option aubinator_opts[] = {
233      { "help",       no_argument,       NULL,     'h' },
234      { "output",     required_argument, NULL,     'o' },
235      { "verbose",    no_argument,       NULL,     'v' },
236      { NULL,         0,                 NULL,     0 }
237   };
238
239   i = 0;
240   while ((c = getopt_long(argc, argv, "ho:v", aubinator_opts, &i)) != -1) {
241      switch (c) {
242      case 'h':
243         help = true;
244         break;
245      case 'o':
246         out_filename = strdup(optarg);
247         break;
248      case 'v':
249         verbose = true;
250         break;
251      default:
252         break;
253      }
254   }
255
256   if (optind < argc)
257      in_filename = argv[optind++];
258
259   if (help || argc == 1 || !in_filename) {
260      print_help(argv[0], stderr);
261      return in_filename ? EXIT_SUCCESS : EXIT_FAILURE;
262   }
263
264   if (out_filename == NULL) {
265      int out_filename_size = strlen(in_filename) + 5;
266      out_filename = malloc(out_filename_size);
267      snprintf(out_filename, out_filename_size, "%s.aub", in_filename);
268   }
269
270   FILE *err_file = fopen(in_filename, "r");
271   fail_if(!err_file, "Failed to open error file \"%s\": %m\n", in_filename);
272
273   FILE *aub_file = fopen(out_filename, "w");
274   fail_if(!aub_file, "Failed to open aub file \"%s\": %m\n", in_filename);
275
276   struct aub_file aub = {};
277
278   enum drm_i915_gem_engine_class active_engine_class = I915_ENGINE_CLASS_INVALID;
279   int active_engine_instance = -1;
280
281   enum address_space active_gtt = PPGTT;
282   enum address_space default_gtt = PPGTT;
283
284   struct {
285      struct {
286         uint32_t ring_buffer_head;
287         uint32_t ring_buffer_tail;
288      } instances[3];
289   } engines[I915_ENGINE_CLASS_VIDEO_ENHANCE + 1];
290   memset(engines, 0, sizeof(engines));
291
292   int num_ring_bos = 0;
293
294   struct list_head bo_list;
295   list_inithead(&bo_list);
296
297   struct bo *last_bo = NULL;
298
299   char *line = NULL;
300   size_t line_size;
301   while (getline(&line, &line_size, err_file) > 0) {
302      const char *pci_id_start = strstr(line, "PCI ID");
303      if (pci_id_start) {
304         int pci_id;
305         int matched = sscanf(line, "PCI ID: 0x%04x\n", &pci_id);
306         fail_if(!matched, "Invalid error state file!\n");
307
308         aub_file_init(&aub, aub_file,
309                       NULL, pci_id, "error_state");
310         if (verbose)
311            aub.verbose_log_file = stdout;
312         default_gtt = active_gtt = aub_use_execlists(&aub) ? PPGTT : GGTT;
313         continue;
314      }
315
316      if (strstr(line, " command stream:")) {
317         engine_from_name(line, &active_engine_class, &active_engine_instance);
318         continue;
319      }
320
321      if (sscanf(line, "  ring->head: 0x%x\n",
322                 &engines[
323                    active_engine_class].instances[
324                       active_engine_instance].ring_buffer_head) == 1) {
325         continue;
326      }
327
328      if (sscanf(line, "  ring->tail: 0x%x\n",
329                 &engines[
330                    active_engine_class].instances[
331                       active_engine_instance].ring_buffer_tail) == 1) {
332         continue;
333      }
334
335      const char *active_start = "Active (";
336      if (strncmp(line, active_start, strlen(active_start)) == 0) {
337         char *ring = line + strlen(active_start);
338
339         engine_from_name(ring, &active_engine_class, &active_engine_instance);
340         active_gtt = default_gtt;
341
342         char *count = strchr(ring, '[');
343         fail_if(!count || sscanf(count, "[%d]:", &num_ring_bos) < 1,
344                 "Failed to parse BO table header\n");
345         continue;
346      }
347
348      const char *global_start = "Pinned (global) [";
349      if (strncmp(line, global_start, strlen(global_start)) == 0) {
350         active_engine_class = I915_ENGINE_CLASS_INVALID;
351         active_engine_instance = -1;
352         active_gtt = GGTT;
353         continue;
354      }
355
356      if (num_ring_bos > 0) {
357         unsigned hi, lo, size;
358         if (sscanf(line, " %x_%x %d", &hi, &lo, &size) == 3) {
359            struct bo *bo_entry = find_or_create(&bo_list, ((uint64_t)hi) << 32 | lo,
360                                                 active_gtt,
361                                                 active_engine_class,
362                                                 active_engine_instance);
363            bo_entry->size = size;
364            num_ring_bos--;
365         } else {
366            fail("Not enough BO entries in the active table\n");
367         }
368         continue;
369      }
370
371      if (line[0] == ':' || line[0] == '~') {
372         if (!last_bo || last_bo->type == BO_TYPE_UNKNOWN)
373            continue;
374
375         int count = ascii85_decode(line+1, (uint32_t **) &last_bo->data, line[0] == ':');
376         fail_if(count == 0, "ASCII85 decode failed.\n");
377         last_bo->size = count * 4;
378         continue;
379      }
380
381      char *dashes = strstr(line, " --- ");
382      if (dashes) {
383         dashes += 5;
384
385         engine_from_name(line, &active_engine_class, &active_engine_instance);
386
387         uint32_t hi, lo;
388         char *bo_address_str = strchr(dashes, '=');
389         if (!bo_address_str || sscanf(bo_address_str, "= 0x%08x %08x\n", &hi, &lo) != 2)
390            continue;
391
392         const struct {
393            const char *match;
394            enum bo_type type;
395            enum address_space gtt;
396         } bo_types[] = {
397            { "gtt_offset", BO_TYPE_BATCH,      default_gtt },
398            { "user",       BO_TYPE_USER,       default_gtt },
399            { "HW context", BO_TYPE_CONTEXT,    GGTT },
400            { "ringbuffer", BO_TYPE_RINGBUFFER, GGTT },
401            { "HW Status",  BO_TYPE_STATUS,     GGTT },
402            { "WA context", BO_TYPE_CONTEXT_WA, GGTT },
403            { "unknown",    BO_TYPE_UNKNOWN,    GGTT },
404         }, *b;
405
406         for (b = bo_types; b->type != BO_TYPE_UNKNOWN; b++) {
407            if (strncasecmp(dashes, b->match, strlen(b->match)) == 0)
408               break;
409         }
410
411         last_bo = find_or_create(&bo_list, ((uint64_t) hi) << 32 | lo,
412                                  b->gtt,
413                                  active_engine_class, active_engine_instance);
414
415         /* The batch buffer will appear twice as gtt_offset and user. Only
416          * keep the batch type.
417          */
418         if (last_bo->type == BO_TYPE_UNKNOWN) {
419            last_bo->type = b->type;
420            last_bo->name = b->match;
421         }
422
423         continue;
424      }
425   }
426
427   if (verbose) {
428      fprintf(stdout, "BOs found:\n");
429      list_for_each_entry(struct bo, bo_entry, &bo_list, link) {
430         fprintf(stdout, "\t type=%i addr=0x%016" PRIx64 " size=%" PRIu64 "\n",
431                 bo_entry->type, bo_entry->addr, bo_entry->size);
432      }
433   }
434
435   /* Find the batch that trigger the hang */
436   struct bo *batch_bo = NULL;
437   list_for_each_entry(struct bo, bo_entry, &bo_list, link) {
438      if (bo_entry->type == BO_TYPE_BATCH) {
439         batch_bo = bo_entry;
440         break;
441      }
442   }
443   fail_if(!batch_bo, "Failed to find batch buffer.\n");
444
445   /* Add all the BOs to the aub file */
446   struct bo *hwsp_bo = NULL;
447   list_for_each_entry(struct bo, bo_entry, &bo_list, link) {
448      switch (bo_entry->type) {
449      case BO_TYPE_BATCH:
450         if (bo_entry->gtt == PPGTT) {
451            aub_map_ppgtt(&aub, bo_entry->addr, bo_entry->size);
452            aub_write_trace_block(&aub, AUB_TRACE_TYPE_BATCH,
453                                  bo_entry->data, bo_entry->size, bo_entry->addr);
454         } else
455            aub_write_ggtt(&aub, bo_entry->addr, bo_entry->size, bo_entry->data);
456         break;
457      case BO_TYPE_USER:
458         if (bo_entry->gtt == PPGTT) {
459            aub_map_ppgtt(&aub, bo_entry->addr, bo_entry->size);
460            aub_write_trace_block(&aub, AUB_TRACE_TYPE_NOTYPE,
461                                  bo_entry->data, bo_entry->size, bo_entry->addr);
462         } else
463            aub_write_ggtt(&aub, bo_entry->addr, bo_entry->size, bo_entry->data);
464         break;
465      case BO_TYPE_CONTEXT:
466         if (bo_entry->engine_class == batch_bo->engine_class &&
467             bo_entry->engine_instance == batch_bo->engine_instance &&
468             aub_use_execlists(&aub)) {
469            hwsp_bo = bo_entry;
470
471            uint32_t *context = (uint32_t *) (bo_entry->data + 4096 /* GuC */ + 4096 /* HWSP */);
472
473            if (context[1] == 0) {
474               fprintf(stderr,
475                       "Invalid context image data.\n"
476                       "This is likely a kernel issue : https://bugs.freedesktop.org/show_bug.cgi?id=107691\n");
477            }
478
479            /* Update the ring buffer at the last known location. */
480            context[5] = engines[bo_entry->engine_class].instances[bo_entry->engine_instance].ring_buffer_head;
481            context[7] = engines[bo_entry->engine_class].instances[bo_entry->engine_instance].ring_buffer_tail;
482            fprintf(stdout, "engine start=0x%x head/tail=0x%x/0x%x\n",
483                    context[9], context[5], context[7]);
484
485            /* The error state doesn't provide a dump of the page tables, so
486             * we have to provide our own, that's easy enough.
487             */
488            context[49] = aub.pml4.phys_addr >> 32;
489            context[51] = aub.pml4.phys_addr & 0xffffffff;
490
491            fprintf(stdout, "context dump:\n");
492            for (int i = 0; i < 60; i++) {
493               if (i % 4 == 0)
494                  fprintf(stdout, "\n 0x%08" PRIx64 ": ", bo_entry->addr + 8192 + i * 4);
495               fprintf(stdout, "0x%08x ", context[i]);
496            }
497            fprintf(stdout, "\n");
498
499         }
500         aub_write_ggtt(&aub, bo_entry->addr, bo_entry->size, bo_entry->data);
501         break;
502      case BO_TYPE_RINGBUFFER:
503      case BO_TYPE_STATUS:
504      case BO_TYPE_CONTEXT_WA:
505         aub_write_ggtt(&aub, bo_entry->addr, bo_entry->size, bo_entry->data);
506         break;
507      case BO_TYPE_UNKNOWN:
508         if (bo_entry->gtt == PPGTT) {
509            aub_map_ppgtt(&aub, bo_entry->addr, bo_entry->size);
510            if (bo_entry->data) {
511               aub_write_trace_block(&aub, AUB_TRACE_TYPE_NOTYPE,
512                                     bo_entry->data, bo_entry->size, bo_entry->addr);
513            }
514         } else {
515            if (bo_entry->size > 0) {
516               void *zero_data = calloc(1, bo_entry->size);
517               aub_write_ggtt(&aub, bo_entry->addr, bo_entry->size, zero_data);
518               free(zero_data);
519            }
520         }
521         break;
522      default:
523         break;
524      }
525   }
526
527   if (aub_use_execlists(&aub)) {
528      fail_if(!hwsp_bo, "Failed to find Context buffer.\n");
529      aub_write_context_execlists(&aub, hwsp_bo->addr + 4096 /* skip GuC page */, hwsp_bo->engine_class);
530   } else {
531      /* Use context id 0 -- if we are not using execlists it doesn't matter
532       * anyway
533       */
534      aub_write_exec(&aub, 0, batch_bo->addr, 0, I915_ENGINE_CLASS_RENDER);
535   }
536
537   /* Cleanup */
538   list_for_each_entry_safe(struct bo, bo_entry, &bo_list, link) {
539      list_del(&bo_entry->link);
540      free(bo_entry->data);
541      free(bo_entry);
542   }
543
544   free(out_filename);
545   free(line);
546   if(err_file) {
547      fclose(err_file);
548   }
549   if(aub.file) {
550      aub_file_finish(&aub);
551   } else if(aub_file) {
552      fclose(aub_file);
553   }
554   return EXIT_SUCCESS;
555}
556
557/* vim: set ts=8 sw=8 tw=0 cino=:0,(0 noet :*/
558