#!/usr/bin/env python

# Capstone Python bindings, by Nguyen Anh Quynnh <[email protected]>

from __future__ import print_function
from capstone import *
from capstone.arm import *
from xprint import to_hex, to_x_32


# Raw machine-code samples; test_class() hands each one to Cs.disasm().
ARM_CODE = b"\x86\x48\x60\xf4\xED\xFF\xFF\xEB\x04\xe0\x2d\xe5\x00\x00\x00\x00\xe0\x83\x22\xe5\xf1\x02\x03\x0e\x00\x00\xa0\xe3\x02\x30\xc1\xe7\x00\x00\x53\xe3\x00\x02\x01\xf1\x05\x40\xd0\xe8\xf4\x80\x00\x00"
ARM_CODE2 = b"\xd1\xe8\x00\xf0\xf0\x24\x04\x07\x1f\x3c\xf2\xc0\x00\x00\x4f\xf0\x00\x01\x46\x6c"
THUMB_CODE = b"\x70\x47\x00\xf0\x10\xe8\xeb\x46\x83\xb0\xc9\x68\x1f\xb1\x30\xbf\xaf\xf3\x20\x84\x52\xf8\x23\xf0"
THUMB_CODE2 = b"\x4f\xf0\x00\x01\xbd\xe8\x00\x88\xd1\xe8\x00\xf0\x18\xbf\xad\xbf\xf3\xff\x0b\x0c\x86\xf3\x00\x89\x80\xf3\x00\x8c\x4f\xfa\x99\xf6\xd0\xff\xa2\x01"
THUMB_MCLASS = b"\xef\xf3\x02\x80"
ARMV8 = b"\xe0\x3b\xb2\xee\x42\x00\x01\xe1\x51\xf0\x7f\xf5"

# One entry per test case, unpacked by test_class() as
# (arch, mode, code, comment, syntax).  A syntax of None leaves the
# disassembler's syntax option untouched.
all_tests = (
    (CS_ARCH_ARM, CS_MODE_ARM, ARM_CODE, "ARM", None),
    (CS_ARCH_ARM, CS_MODE_THUMB, THUMB_CODE, "Thumb", None),
    (CS_ARCH_ARM, CS_MODE_THUMB, ARM_CODE2, "Thumb-mixed", None),
    (CS_ARCH_ARM, CS_MODE_THUMB, THUMB_CODE2, "Thumb-2 & register named with numbers", CS_OPT_SYNTAX_NOREGNAME),
    (CS_ARCH_ARM, CS_MODE_THUMB + CS_MODE_MCLASS, THUMB_MCLASS, "Thumb-MClass", None),
    (CS_ARCH_ARM, CS_MODE_ARM + CS_MODE_V8, ARMV8, "Arm-V8", None),
)
Ebrahimi 27*9a0e4156SSadaf Ebrahimi 28*9a0e4156SSadaf Ebrahimidef print_insn_detail(insn): 29*9a0e4156SSadaf Ebrahimi # print address, mnemonic and operands 30*9a0e4156SSadaf Ebrahimi print("0x%x:\t%s\t%s" % (insn.address, insn.mnemonic, insn.op_str)) 31*9a0e4156SSadaf Ebrahimi 32*9a0e4156SSadaf Ebrahimi # "data" instruction generated by SKIPDATA option has no detail 33*9a0e4156SSadaf Ebrahimi if insn.id == 0: 34*9a0e4156SSadaf Ebrahimi return 35*9a0e4156SSadaf Ebrahimi 36*9a0e4156SSadaf Ebrahimi if len(insn.operands) > 0: 37*9a0e4156SSadaf Ebrahimi print("\top_count: %u" % len(insn.operands)) 38*9a0e4156SSadaf Ebrahimi c = 0 39*9a0e4156SSadaf Ebrahimi for i in insn.operands: 40*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_REG: 41*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: REG = %s" % (c, insn.reg_name(i.reg))) 42*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_IMM: 43*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: IMM = 0x%s" % (c, to_x_32(i.imm))) 44*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_PIMM: 45*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: P-IMM = %u" % (c, i.imm)) 46*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_CIMM: 47*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: C-IMM = %u" % (c, i.imm)) 48*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_FP: 49*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: FP = %f" % (c, i.fp)) 50*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_SYSREG: 51*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: SYSREG = %u" % (c, i.reg)) 52*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_SETEND: 53*9a0e4156SSadaf Ebrahimi if i.setend == ARM_SETEND_BE: 54*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: SETEND = be" % c) 55*9a0e4156SSadaf Ebrahimi else: 56*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: SETEND = le" % c) 57*9a0e4156SSadaf Ebrahimi if i.type == ARM_OP_MEM: 58*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].type: MEM" % c) 59*9a0e4156SSadaf Ebrahimi if i.mem.base != 0: 60*9a0e4156SSadaf 
Ebrahimi print("\t\t\toperands[%u].mem.base: REG = %s" \ 61*9a0e4156SSadaf Ebrahimi % (c, insn.reg_name(i.mem.base))) 62*9a0e4156SSadaf Ebrahimi if i.mem.index != 0: 63*9a0e4156SSadaf Ebrahimi print("\t\t\toperands[%u].mem.index: REG = %s" \ 64*9a0e4156SSadaf Ebrahimi % (c, insn.reg_name(i.mem.index))) 65*9a0e4156SSadaf Ebrahimi if i.mem.scale != 1: 66*9a0e4156SSadaf Ebrahimi print("\t\t\toperands[%u].mem.scale: %u" \ 67*9a0e4156SSadaf Ebrahimi % (c, i.mem.scale)) 68*9a0e4156SSadaf Ebrahimi if i.mem.disp != 0: 69*9a0e4156SSadaf Ebrahimi print("\t\t\toperands[%u].mem.disp: 0x%s" \ 70*9a0e4156SSadaf Ebrahimi % (c, to_x_32(i.mem.disp))) 71*9a0e4156SSadaf Ebrahimi if i.mem.lshift != 0: 72*9a0e4156SSadaf Ebrahimi print("\t\t\toperands[%u].mem.lshift: 0x%s" \ 73*9a0e4156SSadaf Ebrahimi % (c, to_x_32(i.mem.lshift))) 74*9a0e4156SSadaf Ebrahimi 75*9a0e4156SSadaf Ebrahimi if i.neon_lane != -1: 76*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].neon_lane = %u" % (c, i.neon_lane)) 77*9a0e4156SSadaf Ebrahimi 78*9a0e4156SSadaf Ebrahimi if i.access == CS_AC_READ: 79*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].access: READ\n" % (c)) 80*9a0e4156SSadaf Ebrahimi elif i.access == CS_AC_WRITE: 81*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].access: WRITE\n" % (c)) 82*9a0e4156SSadaf Ebrahimi elif i.access == CS_AC_READ | CS_AC_WRITE: 83*9a0e4156SSadaf Ebrahimi print("\t\toperands[%u].access: READ | WRITE\n" % (c)) 84*9a0e4156SSadaf Ebrahimi 85*9a0e4156SSadaf Ebrahimi if i.shift.type != ARM_SFT_INVALID and i.shift.value: 86*9a0e4156SSadaf Ebrahimi print("\t\t\tShift: %u = %u" \ 87*9a0e4156SSadaf Ebrahimi % (i.shift.type, i.shift.value)) 88*9a0e4156SSadaf Ebrahimi if i.vector_index != -1: 89*9a0e4156SSadaf Ebrahimi print("\t\t\toperands[%u].vector_index = %u" %(c, i.vector_index)) 90*9a0e4156SSadaf Ebrahimi if i.subtracted: 91*9a0e4156SSadaf Ebrahimi print("\t\t\toperands[%u].subtracted = True" %c) 92*9a0e4156SSadaf Ebrahimi 93*9a0e4156SSadaf Ebrahimi c += 1 94*9a0e4156SSadaf 
Ebrahimi 95*9a0e4156SSadaf Ebrahimi if insn.update_flags: 96*9a0e4156SSadaf Ebrahimi print("\tUpdate-flags: True") 97*9a0e4156SSadaf Ebrahimi if insn.writeback: 98*9a0e4156SSadaf Ebrahimi print("\tWrite-back: True") 99*9a0e4156SSadaf Ebrahimi if not insn.cc in [ARM_CC_AL, ARM_CC_INVALID]: 100*9a0e4156SSadaf Ebrahimi print("\tCode condition: %u" % insn.cc) 101*9a0e4156SSadaf Ebrahimi if insn.cps_mode: 102*9a0e4156SSadaf Ebrahimi print("\tCPSI-mode: %u" %(insn.cps_mode)) 103*9a0e4156SSadaf Ebrahimi if insn.cps_flag: 104*9a0e4156SSadaf Ebrahimi print("\tCPSI-flag: %u" %(insn.cps_flag)) 105*9a0e4156SSadaf Ebrahimi if insn.vector_data: 106*9a0e4156SSadaf Ebrahimi print("\tVector-data: %u" %(insn.vector_data)) 107*9a0e4156SSadaf Ebrahimi if insn.vector_size: 108*9a0e4156SSadaf Ebrahimi print("\tVector-size: %u" %(insn.vector_size)) 109*9a0e4156SSadaf Ebrahimi if insn.usermode: 110*9a0e4156SSadaf Ebrahimi print("\tUser-mode: True") 111*9a0e4156SSadaf Ebrahimi if insn.mem_barrier: 112*9a0e4156SSadaf Ebrahimi print("\tMemory-barrier: %u" %(insn.mem_barrier)) 113*9a0e4156SSadaf Ebrahimi 114*9a0e4156SSadaf Ebrahimi (regs_read, regs_write) = insn.regs_access() 115*9a0e4156SSadaf Ebrahimi 116*9a0e4156SSadaf Ebrahimi if len(regs_read) > 0: 117*9a0e4156SSadaf Ebrahimi print("\tRegisters read:", end="") 118*9a0e4156SSadaf Ebrahimi for r in regs_read: 119*9a0e4156SSadaf Ebrahimi print(" %s" %(insn.reg_name(r)), end="") 120*9a0e4156SSadaf Ebrahimi print("") 121*9a0e4156SSadaf Ebrahimi 122*9a0e4156SSadaf Ebrahimi if len(regs_write) > 0: 123*9a0e4156SSadaf Ebrahimi print("\tRegisters modified:", end="") 124*9a0e4156SSadaf Ebrahimi for r in regs_write: 125*9a0e4156SSadaf Ebrahimi print(" %s" %(insn.reg_name(r)), end="") 126*9a0e4156SSadaf Ebrahimi print("") 127*9a0e4156SSadaf Ebrahimi 128*9a0e4156SSadaf Ebrahimi 129*9a0e4156SSadaf Ebrahimi# ## Test class Cs 130*9a0e4156SSadaf Ebrahimidef test_class(): 131*9a0e4156SSadaf Ebrahimi 132*9a0e4156SSadaf Ebrahimi for (arch, mode, code, 
comment, syntax) in all_tests: 133*9a0e4156SSadaf Ebrahimi print("*" * 16) 134*9a0e4156SSadaf Ebrahimi print("Platform: %s" % comment) 135*9a0e4156SSadaf Ebrahimi print("Code: %s" % to_hex(code)) 136*9a0e4156SSadaf Ebrahimi print("Disasm:") 137*9a0e4156SSadaf Ebrahimi 138*9a0e4156SSadaf Ebrahimi try: 139*9a0e4156SSadaf Ebrahimi md = Cs(arch, mode) 140*9a0e4156SSadaf Ebrahimi if syntax is not None: 141*9a0e4156SSadaf Ebrahimi md.syntax = syntax 142*9a0e4156SSadaf Ebrahimi md.detail = True 143*9a0e4156SSadaf Ebrahimi for insn in md.disasm(code, 0x80001000): 144*9a0e4156SSadaf Ebrahimi print_insn_detail(insn) 145*9a0e4156SSadaf Ebrahimi print () 146*9a0e4156SSadaf Ebrahimi except CsError as e: 147*9a0e4156SSadaf Ebrahimi print("ERROR: %s" % e) 148*9a0e4156SSadaf Ebrahimi 149*9a0e4156SSadaf Ebrahimi 150*9a0e4156SSadaf Ebrahimiif __name__ == '__main__': 151*9a0e4156SSadaf Ebrahimi test_class() 152