/* * Copyright © 2022 Intel Corporation * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice (including the next * paragraph) shall be included in all copies or substantial portions of the * Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS * IN THE SOFTWARE. * * Capture the hanging application with INTEL_DEBUG=capture-all * * Turn the error state into a replay file with : * $ intel_error2hangdump error_state * * Replay with : * $ intel_hang_replay -d error_state.dmp */ #include #include #include #include #include #include #include #include #include #include #include #include "common/intel_gem.h" #include "common/i915/intel_gem.h" #include "common/intel_hang_dump.h" #include "compiler/elk/elk_disasm.h" #include "compiler/elk/elk_isa_info.h" #include "compiler/brw_disasm.h" #include "compiler/brw_isa_info.h" #include "dev/intel_device_info.h" #include "drm-uapi/i915_drm.h" #include "util/u_dynarray.h" #include "util/u_math.h" static uint32_t gem_create(int drm_fd, uint64_t size) { struct drm_i915_gem_create gem_create = { .size = size, }; int ret = intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_CREATE, &gem_create); if (ret != 0) { /* FIXME: What do we do if this fails? */ return 0; } return gem_create.handle; } static uint32_t gem_context_create(int drm_fd) { /* TODO: add additional information in the intel_hang_dump_block_exec & * intel_hang_dump_block_hw_image structures to specify the engine and use * the correct engine here. */ I915_DEFINE_CONTEXT_PARAM_ENGINES(engines_param, 1) = { }; struct drm_i915_gem_context_create_ext_setparam set_engines = { .param = { .param = I915_CONTEXT_PARAM_ENGINES, .value = (uintptr_t)&engines_param, .size = sizeof(engines_param), } }; struct drm_i915_gem_context_create_ext_setparam recoverable_param = { .param = { .param = I915_CONTEXT_PARAM_RECOVERABLE, .value = 0, }, }; struct drm_i915_gem_context_create_ext create = { .flags = I915_CONTEXT_CREATE_FLAGS_USE_EXTENSIONS, }; intel_i915_gem_add_ext(&create.extensions, I915_CONTEXT_CREATE_EXT_SETPARAM, &set_engines.base); intel_i915_gem_add_ext(&create.extensions, I915_CONTEXT_CREATE_EXT_SETPARAM, &recoverable_param.base); if (intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_CONTEXT_CREATE_EXT, &create) == -1) return false; return create.ctx_id; } static bool gem_context_set_hw_image(int drm_fd, uint32_t ctx_id, const void *hw_img_data, uint32_t img_size) { /* TODO: add additional information in the intel_hang_dump_block_exec & * intel_hang_dump_block_hw_image structures to specify the engine and use * the correct engine here. */ struct i915_gem_context_param_context_image img_param = { .engine = { .engine_class = 0, .engine_instance = 0, }, .flags = I915_CONTEXT_IMAGE_FLAG_ENGINE_INDEX, .size = img_size, .image = (uint64_t)(uintptr_t)hw_img_data, }; struct drm_i915_gem_context_param param = { .ctx_id = ctx_id, .param = I915_CONTEXT_PARAM_CONTEXT_IMAGE, }; uint64_t val = 0; int ret; param.ctx_id = ctx_id; param.param = I915_CONTEXT_PARAM_RECOVERABLE; param.value = (uint64_t)(uintptr_t)&val; ret = intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_CONTEXT_SETPARAM, ¶m); if (ret) return false; param.param = I915_CONTEXT_PARAM_CONTEXT_IMAGE; param.size = sizeof(img_param); param.value = (uint64_t)(uintptr_t)&img_param; return intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_CONTEXT_SETPARAM, ¶m) == 0; } static void* gem_mmap_offset(int drm_fd, uint32_t gem_handle, uint64_t offset, uint64_t size, uint32_t flags) { struct drm_i915_gem_mmap_offset gem_mmap = { .handle = gem_handle, .flags = I915_MMAP_OFFSET_WB, }; assert(offset == 0); /* Get the fake offset back */ int ret = intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_MMAP_OFFSET, &gem_mmap); if (ret != 0 && gem_mmap.flags == I915_MMAP_OFFSET_FIXED) { gem_mmap.flags = (flags & I915_MMAP_WC) ? I915_MMAP_OFFSET_WC : I915_MMAP_OFFSET_WB, ret = intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_MMAP_OFFSET, &gem_mmap); } if (ret != 0) return MAP_FAILED; /* And map it */ void *map = mmap(NULL, size, PROT_READ | PROT_WRITE, MAP_SHARED, drm_fd, gem_mmap.offset); return map; } static void write_malloc_data(void *out_data, int file_fd, size_t size) { size_t total_read_len = 0; ssize_t read_len; while (total_read_len < size && (read_len = read(file_fd, out_data + total_read_len, size - total_read_len)) > 0) { total_read_len += read_len; } assert(total_read_len == size); } static void write_gem_bo_data(int drm_fd, uint32_t gem_handle, int file_fd, size_t size) { void *map = gem_mmap_offset(drm_fd, gem_handle, 0, size, I915_MMAP_OFFSET_WB); assert(map != MAP_FAILED); size_t total_read_len = 0; ssize_t read_len; while (total_read_len < size && (read_len = read(file_fd, map + total_read_len, size - total_read_len)) > 0) { total_read_len += read_len; } munmap(map, size); assert(total_read_len == size); } static void skip_data(int file_fd, size_t size) { lseek(file_fd, size, SEEK_CUR); } static int get_drm_device(struct intel_device_info *devinfo) { drmDevicePtr devices[8]; int max_devices = drmGetDevices2(0, devices, 8); int i, fd = -1; for (i = 0; i < max_devices; i++) { if (devices[i]->available_nodes & 1 << DRM_NODE_RENDER && devices[i]->bustype == DRM_BUS_PCI && devices[i]->deviceinfo.pci->vendor_id == 0x8086) { fd = open(devices[i]->nodes[DRM_NODE_RENDER], O_RDWR | O_CLOEXEC); if (fd < 0) continue; if (!intel_get_device_info_from_fd(fd, devinfo, -1, -1) || devinfo->ver < 8) { close(fd); fd = -1; continue; } /* Found a device! */ break; } } return fd; } struct gem_bo { off_t file_offset; uint32_t gem_handle; uint64_t offset; uint64_t size; bool hw_img; }; static int compare_bos(const void *b1, const void *b2) { const struct gem_bo *gem_b1 = b1, *gem_b2 = b2; return gem_b2->size > gem_b1->size; } static void print_help(const char *filename, FILE *f) { fprintf(f, "%s: %s [options]...\n", filename, filename); fprintf(f, " -d, --dump FILE hang file to replay\n"); fprintf(f, " -l, --list list content of hang file (no replay)\n"); fprintf(f, " -s, --shader ADDR print shader at ADDR\n"); fprintf(f, " -h, --help print this screen\n"); fprintf(f, " -a, --address ADDR Find BO containing ADDR\n"); } static int execbuffer(int drm_fd, uint32_t context_id, struct util_dynarray *execbuffer_bos, struct gem_bo *exec_bo, uint64_t exec_offset) { struct drm_i915_gem_execbuffer2 execbuf = { .buffers_ptr = (uintptr_t)(void *)util_dynarray_begin(execbuffer_bos), .buffer_count = util_dynarray_num_elements(execbuffer_bos, struct drm_i915_gem_exec_object2), .batch_start_offset = exec_offset - exec_bo->offset, .batch_len = exec_bo->size, .flags = I915_EXEC_HANDLE_LUT, .rsvd1 = context_id, }; int ret = intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_EXECBUFFER2_WR, &execbuf); if (ret == 0) { struct drm_i915_gem_wait gem_wait = { .bo_handle = exec_bo->gem_handle, .timeout_ns = INT64_MAX, }; ret = intel_ioctl(drm_fd, DRM_IOCTL_I915_GEM_WAIT, &gem_wait); if (ret) fprintf(stderr, "wait failed: %m\n"); } else { fprintf(stderr, "execbuffer failed: %m\n"); } return ret; } int main(int argc, char *argv[]) { bool help = false, list = false; const struct option aubinator_opts[] = { { "address", required_argument, NULL, 'a' }, { "dump", required_argument, NULL, 'd' }, { "shader", required_argument, NULL, 's' }, { "list", no_argument, NULL, 'l' }, { "help", no_argument, NULL, 'h' }, { NULL, 0, NULL, 0 }, }; void *mem_ctx = ralloc_context(NULL); struct util_dynarray shader_addresses; util_dynarray_init(&shader_addresses, mem_ctx); const char *file = NULL; uint64_t check_addr = -1; int c, i; while ((c = getopt_long(argc, argv, "a:d:hls:", aubinator_opts, &i)) != -1) { switch (c) { case 'a': check_addr = strtol(optarg, NULL, 0); break; case 'd': file = optarg; break; case 's': { uint64_t *addr = util_dynarray_grow(&shader_addresses, uint64_t, 1); *addr = strtol(optarg, NULL, 0); fprintf(stderr, "shader addr=0x%016"PRIx64"\n", *addr); break; } case 'h': help = true; break; case 'l': list = true; break; default: break; } } if (help) { print_help(argv[0], stderr); exit(EXIT_SUCCESS); } int file_fd = open(file, O_RDONLY); if (file_fd < 0) exit(EXIT_FAILURE); struct stat file_stats; if (fstat(file_fd, &file_stats) != 0) exit(EXIT_FAILURE); struct intel_device_info devinfo; int drm_fd = get_drm_device(&devinfo); if (drm_fd < 0) exit(EXIT_FAILURE); struct util_dynarray buffers; uint64_t total_vma = 0; util_dynarray_init(&buffers, mem_ctx); union intel_hang_dump_block_all block_header; struct intel_hang_dump_block_exec init = { .offset = -1, }, exec = { .offset = -1, }; while (read(file_fd, &block_header.base, sizeof(block_header.base)) == sizeof(block_header.base)) { static const size_t block_size[] = { [INTEL_HANG_DUMP_BLOCK_TYPE_HEADER] = sizeof(struct intel_hang_dump_block_header), [INTEL_HANG_DUMP_BLOCK_TYPE_BO] = sizeof(struct intel_hang_dump_block_bo), [INTEL_HANG_DUMP_BLOCK_TYPE_MAP] = sizeof(struct intel_hang_dump_block_map), [INTEL_HANG_DUMP_BLOCK_TYPE_EXEC] = sizeof(struct intel_hang_dump_block_exec), [INTEL_HANG_DUMP_BLOCK_TYPE_HW_IMAGE] = sizeof(struct intel_hang_dump_block_hw_image), }; assert(block_header.base.type < ARRAY_SIZE(block_size)); size_t remaining_size = block_size[block_header.base.type] - sizeof(block_header.base); ssize_t ret = read(file_fd, &block_header.base + 1, remaining_size); bool has_hw_image = false; assert(ret == remaining_size); switch (block_header.base.type) { case INTEL_HANG_DUMP_BLOCK_TYPE_HEADER: assert(block_header.header.magic == INTEL_HANG_DUMP_MAGIC); assert(block_header.header.version == INTEL_HANG_DUMP_VERSION); break; case INTEL_HANG_DUMP_BLOCK_TYPE_BO: { struct gem_bo *bo = util_dynarray_grow(&buffers, struct gem_bo, 1); *bo = (struct gem_bo) { .file_offset = lseek(file_fd, 0, SEEK_CUR), .offset = block_header.bo.offset, .size = block_header.bo.size, }; total_vma += bo->size; skip_data(file_fd, bo->size); if (list) { fprintf(stderr, "buffer: offset=0x%016"PRIx64" size=0x%016"PRIx64" name=%s\n", bo->offset, bo->size, block_header.bo.name); } break; } case INTEL_HANG_DUMP_BLOCK_TYPE_HW_IMAGE: { struct gem_bo *bo = util_dynarray_grow(&buffers, struct gem_bo, 1); *bo = (struct gem_bo) { .file_offset = lseek(file_fd, 0, SEEK_CUR), .offset = 0, .size = block_header.hw_img.size, .hw_img = true, }; total_vma += bo->size; skip_data(file_fd, bo->size); if (list) { fprintf(stderr, "buffer: offset=0x%016"PRIx64" size=0x%016"PRIx64" name=hw_img\n", bo->offset, bo->size); } has_hw_image = true; break; } case INTEL_HANG_DUMP_BLOCK_TYPE_MAP: { struct gem_bo *bo = util_dynarray_grow(&buffers, struct gem_bo, 1); *bo = (struct gem_bo) { .file_offset = 0, .offset = block_header.map.offset, .size = block_header.map.size, }; total_vma += bo->size; if (list) { fprintf(stderr, "map : offset=0x%016"PRIx64" size=0x%016"PRIx64" name=%s\n", bo->offset, bo->size, block_header.map.name); } break; } case INTEL_HANG_DUMP_BLOCK_TYPE_EXEC: { if (init.offset == 0 && !has_hw_image) { if (list) fprintf(stderr, "init : offset=0x%016"PRIx64"\n", block_header.exec.offset); init = block_header.exec; } else { if (list) fprintf(stderr, "exec : offset=0x%016"PRIx64"\n", block_header.exec.offset); exec = block_header.exec; } break; } default: unreachable("Invalid block type"); } } fprintf(stderr, "total_vma: 0x%016"PRIx64"\n", total_vma); if (check_addr != -1) { struct gem_bo *check_bo = NULL; util_dynarray_foreach(&buffers, struct gem_bo, bo) { if (check_addr >= bo->offset && check_addr < (bo->offset + bo->size)) { check_bo = bo; break; } } if (check_bo) { fprintf(stderr, "address=0x%016"PRIx64" found in buffer 0x%016"PRIx64" size=0x%016"PRIx64"\n", check_addr, check_bo->offset, check_bo->size); } else { fprintf(stderr, "address=0x%016"PRIx64" not found in buffer list\n", check_addr); } } util_dynarray_foreach(&shader_addresses, uint64_t, addr) { bool found = false; util_dynarray_foreach(&buffers, struct gem_bo, bo) { if (*addr < bo->offset || *addr >= (bo->offset + bo->size)) continue; if (!bo->file_offset) break; uint64_t aligned_offset = ROUND_DOWN_TO(bo->file_offset, 4096); uint64_t remaining_length = file_stats.st_size - aligned_offset; void *map = mmap(NULL, remaining_length, PROT_READ, MAP_PRIVATE, file_fd, aligned_offset); if (map == MAP_FAILED) break; found = true; fprintf(stderr, "shader at 0x%016"PRIx64" file_offset=0%016"PRIx64" addr_offset=%016"PRIx64":\n", *addr, (bo->file_offset - aligned_offset), (*addr - bo->offset)); if (devinfo.ver >= 9) { struct brw_isa_info _isa, *isa = &_isa; brw_init_isa_info(isa, &devinfo); brw_disassemble_with_errors(isa, map + (bo->file_offset - aligned_offset) + (*addr - bo->offset), 0, stderr); } else { struct elk_isa_info _isa, *isa = &_isa; elk_init_isa_info(isa, &devinfo); elk_disassemble_with_errors(isa, map + (bo->file_offset - aligned_offset) + (*addr - bo->offset), 0, stderr); } munmap(map, remaining_length); } if (!found) fprintf(stderr, "shader at 0x%016"PRIx64" not found\n", *addr); } if (!list && util_dynarray_num_elements(&shader_addresses, uint64_t) == 0) { /* Sort buffers by size */ qsort(util_dynarray_begin(&buffers), util_dynarray_num_elements(&buffers, struct gem_bo), sizeof(struct gem_bo), compare_bos); void *hw_img = NULL; uint32_t hw_img_size = 0; /* Allocate BOs populate them */ uint64_t gem_allocated = 0; util_dynarray_foreach(&buffers, struct gem_bo, bo) { lseek(file_fd, bo->file_offset, SEEK_SET); if (bo->hw_img) { hw_img = malloc(bo->size); write_malloc_data(hw_img, file_fd, bo->size); hw_img_size = bo->size; } else { bo->gem_handle = gem_create(drm_fd, bo->size); write_gem_bo_data(drm_fd, bo->gem_handle, file_fd, bo->size); } gem_allocated += bo->size; } uint32_t ctx_id = gem_context_create(drm_fd); if (ctx_id == 0) { fprintf(stderr, "fail to create context: %s\n", strerror(errno)); return EXIT_FAILURE; } if (hw_img != NULL) { if (!gem_context_set_hw_image(drm_fd, ctx_id, hw_img, hw_img_size)) { fprintf(stderr, "fail to set context hw img: %s\n", strerror(errno)); return EXIT_FAILURE; } } struct util_dynarray execbuffer_bos; util_dynarray_init(&execbuffer_bos, mem_ctx); struct gem_bo *init_bo = NULL, *batch_bo = NULL; util_dynarray_foreach(&buffers, struct gem_bo, bo) { if (bo->offset <= init.offset && (bo->offset + bo->size) > init.offset) { init_bo = bo; continue; } if (bo->offset <= exec.offset && (bo->offset + bo->size) > exec.offset) { batch_bo = bo; continue; } if (bo->hw_img) continue; struct drm_i915_gem_exec_object2 *execbuf_bo = util_dynarray_grow(&execbuffer_bos, struct drm_i915_gem_exec_object2, 1); *execbuf_bo = (struct drm_i915_gem_exec_object2) { .handle = bo->gem_handle, .relocation_count = 0, .relocs_ptr = 0, .flags = EXEC_OBJECT_SUPPORTS_48B_ADDRESS | EXEC_OBJECT_PINNED | EXEC_OBJECT_CAPTURE, .offset = intel_canonical_address(bo->offset), }; } assert(batch_bo != NULL); struct drm_i915_gem_exec_object2 *execbuf_bo = util_dynarray_grow(&execbuffer_bos, struct drm_i915_gem_exec_object2, 1); int ret; if (init_bo) { fprintf(stderr, "init: 0x%016"PRIx64"\n", init_bo->offset); *execbuf_bo = (struct drm_i915_gem_exec_object2) { .handle = init_bo->gem_handle, .relocation_count = 0, .relocs_ptr = 0, .flags = EXEC_OBJECT_SUPPORTS_48B_ADDRESS | EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE /* to be able to wait on the BO */ | EXEC_OBJECT_CAPTURE, .offset = intel_canonical_address(init_bo->offset), }; ret = execbuffer(drm_fd, ctx_id, &execbuffer_bos, init_bo, init.offset); if (ret != 0) { fprintf(stderr, "initialization buffer failed to execute errno=%i\n", errno); exit(-1); } } else { fprintf(stderr, "no init BO\n"); } if (batch_bo) { fprintf(stderr, "exec: 0x%016"PRIx64" aperture=%.2fMb\n", batch_bo->offset, gem_allocated / 1024.0 / 1024.0); *execbuf_bo = (struct drm_i915_gem_exec_object2) { .handle = batch_bo->gem_handle, .relocation_count = 0, .relocs_ptr = 0, .flags = EXEC_OBJECT_SUPPORTS_48B_ADDRESS | EXEC_OBJECT_PINNED | EXEC_OBJECT_WRITE /* to be able to wait on the BO */ | EXEC_OBJECT_CAPTURE, .offset = intel_canonical_address(batch_bo->offset), }; ret = execbuffer(drm_fd, ctx_id, &execbuffer_bos, batch_bo, exec.offset); if (ret != 0) { fprintf(stderr, "replayed buffer failed to execute errno=%i\n", errno); exit(-1); } else { fprintf(stderr, "exec completed successfully\n"); } } else { fprintf(stderr, "no exec BO\n"); } } close(drm_fd); close(file_fd); ralloc_free(mem_ctx); return EXIT_SUCCESS; }