LIEF/examples/python/macho_reader.py

593 lines
18 KiB
Python
Executable File

#!/usr/bin/env python
# -*- coding: utf-8 -*-
# Description
# -----------
# Print information about a Mach-O binary
import sys
import os
import argparse
import traceback
import lief
from lief import MachO
from lief import Logger
Logger.set_level(lief.LOGGING_LEVEL.INFO)
terminal_rows, terminal_columns = 100, 100
try:
terminal_rows, terminal_columns = os.popen('stty size', 'r').read().split()
except ValueError:
pass
terminal_columns = int(terminal_columns)
terminal_rows = int(terminal_rows)
class exceptions_handler(object):
func = None
def __init__(self, exceptions, on_except_callback=None):
self.exceptions = exceptions
self.on_except_callback = on_except_callback
def __call__(self, *args, **kwargs):
if self.func is None:
self.func = args[0]
return self
try:
return self.func(*args, **kwargs)
except self.exceptions as e:
if self.on_except_callback is not None:
self.on_except_callback(e)
else:
print("-" * 60)
print("Exception in {}: {}".format(self.func.__name__, e))
exc_type, exc_value, exc_traceback = sys.exc_info()
traceback.print_tb(exc_traceback)
print("-" * 60)
@exceptions_handler(Exception)
def print_information(binary):
print("== Information ==")
format_str = "{:<30} {:<30}"
format_hex = "{:<30} 0x{:<28x}"
format_dec = "{:<30} {:<30d}"
print(format_str.format("Name:", binary.name))
print(format_hex.format("Address base:", binary.imagebase))
print(format_str.format("PIE:", str(binary.is_pie)))
print(format_str.format("NX:", str(binary.has_nx)))
print("")
@exceptions_handler(Exception)
def print_header(binary):
format_str = "{:<33} {:<30}"
format_hex = "{:<33} 0x{:<28x}"
format_dec = "{:<33} {:<30d}"
print("== Header ==")
header = binary.header
flags_str = " - ".join([str(s).split(".")[-1] for s in header.flags_list])
print(format_str.format("Magic:", str(header.magic).split(".")[-1]))
print(format_str.format("CPU Type:", str(header.cpu_type).split(".")[-1]))
print(format_hex.format("CPU sub-type:", header.cpu_subtype))
print(format_str.format("File Type:", str(header.file_type).split(".")[-1]))
print(format_str.format("Flags:", flags_str))
print(format_dec.format("Number of commands:", header.nb_cmds))
print(format_hex.format("Size of commands:", header.sizeof_cmds))
print(format_hex.format("Reserved:", header.reserved))
@exceptions_handler(Exception)
def print_commands(binary):
f_title = "|{:<20}|{:<11}|{:<11}|"
f_value = "|{:<20}|0x{:08x} |0x{:08x} |"
print("== Commands ==")
print(f_title.format("Command", "Offset", "Size"))
for command in binary.commands:
print(f_value.format(
str(command.command).split(".")[-1],
command.command_offset,
command.size))
print("")
@exceptions_handler(Exception)
def print_libraries(binary):
f_title = "|{:<30}|{:<10}|{:<16}|{:<22}|"
f_value = "|{:<30}|{:<10d}|{:<16x}|{:<22x}|"
print("== Libraries ==")
print(f_title.format("Name", "Timestamp", "Current Version", "Compatibility Version"))
for library in binary.libraries:
print(f_value.format(
library.name,
library.timestamp,
library.current_version,
library.compatibility_version))
print("")
@exceptions_handler(Exception)
def print_segments(binary):
f_title = "|{:<20}|{:<16}|{:<16}|{:<16}|{:16}|{:16}|{:16}|{}"
f_value = "|{:<20}|0x{:<13x} |0x{:<13x} |0x{:<13x} |0x{:<13x} |0x{:<13x} |0x{:<13x} |{}"
print("== Segments ==")
print(f_title.format(
"Name", "Virtual Address", "Virtual Size",
"Offset", "Size", "Max Protection",
"Init Protection", "Sections"))
for segment in binary.segments:
sections = ", ".join(map(lambda s : s.name, segment.sections))
print(f_value.format(
segment.name,
segment.virtual_address,
segment.virtual_size,
segment.file_offset,
segment.file_size,
segment.max_protection,
segment.init_protection,
sections))
print("")
@exceptions_handler(Exception)
def print_sections(binary):
f_title = "|{:<20}|{:<16}|{:<16}|{:<16}|{:16}|{:22}|{:19}|{:25}|"
f_value = "|{:<20}|0x{:<13x} |0x{:<13x} |0x{:<13x} |0x{:<13x} |0x{:<19x} |0x{:<16x} |{:<25}|"
print("== Sections ==")
print(f_title.format(
"Name", "Virtual Address", "Offset", "Size",
"Alignement", "Number of Relocations", "Relocation offset",
"Type"))
for section in binary.sections:
print(f_value.format(
section.name,
section.virtual_address,
section.offset,
section.size,
section.alignment,
section.numberof_relocations,
section.relocation_offset,
str(section.type).split(".")[-1]))
if len(section.relocations) > 0:
for idx, reloc in enumerate(section.relocations):
name = reloc.symbol.name if reloc.has_symbol else ""
secname = " - " + reloc.section.name if reloc.has_section else ""
type = str(reloc.type)
if reloc.architecture == MachO.CPU_TYPES.x86:
type = str(MachO.X86_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.x86_64:
type = str(MachO.X86_64_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.ARM:
type = str(MachO.ARM_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.ARM64:
type = str(MachO.ARM64_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.POWERPC:
type = str(MachO.PPC_RELOCATION(reloc.type))
print(" [Reloc #{:d} {section}] {name:<10} 0x{address:<6x} {type:<20} {size:d} {pcrel} {scat}".format(
idx,
section=secname,
name=name,
address=reloc.address,
type=type.split(".")[-1],
size=reloc.size,
pcrel=str(reloc.pc_relative),
scat=str(reloc.is_scattered)))
print("")
print("")
@exceptions_handler(Exception)
def print_symbols(binary):
symbols = binary.symbols
if len(symbols) == 0:
return
try:
maxsize = max([len(symbol.demangled_name) for symbol in symbols])
except:
maxsize = max([len(symbol.name) for symbol in symbols])
maxsize = min(maxsize, terminal_columns - 90) if terminal_columns > 90 else terminal_columns
f_title = "|{:<" + str(maxsize) + "} |{:<6}|{:<19}|{:<16}|{:16}| {:s}"
f_value = "|{:<" + str(maxsize) + "} |0x{:<3x} |0x{:<16x} |0x{:<13x} |0x{:<13x} | {:s}"
print("== Symbols ==")
print(f_title.format(
"Name", "Type", "Number of Sections", "Description", "Value", "Library"))
for symbol in binary.symbols:
libname = ""
if symbol.has_binding_info and symbol.binding_info.has_library:
libname = symbol.binding_info.library.name
symbol_value = symbol.value if symbol.value > 0 or not symbol.has_binding_info else symbol.binding_info.address
try:
symbol_name = symbol.demangled_name
except:
symbol_name = symbol.name
print(f_value.format(
symbol_name,
symbol.type,
symbol.numberof_sections,
symbol.description,
symbol_value,
libname))
print("")
@exceptions_handler(Exception)
def print_uuid(binary):
print("== UUID ==")
cmd = binary.uuid
uuid_str = " ".join(map(lambda e : "{:02x}".format(e), cmd.uuid))
print("UUID: {}".format(uuid_str))
print("")
@exceptions_handler(Exception)
def print_main_command(binary):
format_str = "{:<13} {:<30}"
format_hex = "{:<13} 0x{:<28x}"
format_dec = "{:<13} {:<30d}"
print("== Main Command ==")
cmd = binary.main_command
print(format_hex.format("Entry point:", cmd.entrypoint))
print(format_hex.format("Stack size:", cmd.stack_size))
print("")
@exceptions_handler(Exception)
def print_thread_command(binary):
format_str = "{:<13} {:<30}"
format_hex = "{:<13} 0x{:<28x}"
format_dec = "{:<13} {:<30d}"
print("== Thread Command ==")
cmd = binary.thread_command
print(format_hex.format("Flavor:", cmd.flavor))
print(format_hex.format("Count:", cmd.count))
print(format_hex.format("PC:", cmd.pc))
print("")
@exceptions_handler(Exception)
def print_rpath_command(binary):
format_str = "{:<13} {:<30}"
format_hex = "{:<13} 0x{:<28x}"
format_dec = "{:<13} {:<30d}"
print("== Rpath Command ==")
cmd = binary.rpath
print("Path: {}".format(cmd.path))
print("")
@exceptions_handler(Exception)
def print_dylinker(binary):
print("== Dylinker ==")
print("Path: {}".format(binary.dylinker.name))
print("")
@exceptions_handler(Exception)
def print_function_starts(binary):
format_str = "{:<13} {:<30}"
format_hex = "{:<13} 0x{:<28x}"
format_dec = "{:<13} {:<30d}"
print("== Function Starts ==")
fstarts = binary.function_starts
print(format_hex.format("Offset:", fstarts.data_offset))
print(format_hex.format("Size:", fstarts.data_size))
print("Functions: ({:d})".format(len(fstarts.functions)))
for idx, address in enumerate(fstarts.functions):
print(" [{:d}] __TEXT + 0x{:x}".format(idx, address))
print("")
@exceptions_handler(Exception)
def print_dyld_info(binary):
print("== Dyld Info ==")
f_title = "|{:<12}|{:<11}|{:<11}|"
f_value = "|{:<12}|0x{:<8x} |0x{:<8x} |"
dyld_info = binary.dyld_info
print(f_title.format("Type", "Offset", "Size"))
print(f_value.format("Rebase", dyld_info.rebase[0], dyld_info.rebase[1]))
print(f_value.format("Bind", dyld_info.bind[0], dyld_info.bind[1]))
print(f_value.format("Weak Bind", dyld_info.weak_bind[0], dyld_info.weak_bind[1]))
print(f_value.format("Lazy Bind", dyld_info.lazy_bind[0], dyld_info.lazy_bind[1]))
print(f_value.format("Export", dyld_info.export_info[0], dyld_info.export_info[1]))
print("")
print("Bindings")
print("--------")
for idx, binfo in enumerate(dyld_info.bindings):
print("{:10}: {}".format("Class", str(binfo.binding_class).split(".")[-1]))
print("{:10}: {}".format("Type", str(binfo.binding_type).split(".")[-1]))
print("{:10}: {:x}".format("Address", binfo.address))
if binfo.has_symbol:
print("{:10}: {}".format("Symbol", binfo.symbol.name))
if binfo.has_segment:
print("{:10}: {}".format("Segment", binfo.segment.name))
if binfo.has_library:
print("{:10}: {}".format("Library", binfo.library.name))
print("")
print("")
print("Exports")
print("-------")
for idx, einfo in enumerate(dyld_info.exports):
print("{:10}: {:<10x}".format("Address", einfo.address))
print("{:10}: {:<10x}".format("Flags", einfo.flags))
if binfo.has_symbol:
print("{:10}: {}".format("Symbol", einfo.symbol.name))
print("")
print("")
@exceptions_handler(Exception)
def print_source_version(binary):
print("== Source Version ==")
version = binary.source_version.version
print("Version: {:d}.{:d}.{:d}.{:d}.{:d}".format(*version))
print("")
@exceptions_handler(Exception)
def print_version_min(binary):
print("== Version Min ==")
version = binary.version_min.version
sdk = binary.version_min.sdk
print("Version: {:d}.{:d}.{:d}".format(*version))
print("SDK: {:d}.{:d}.{:d}".format(*sdk))
print("")
@exceptions_handler(Exception)
def print_relocations(binary):
print("== Relocations ==")
f_value = "|0x{address:<10x} | {size:<4d} | {type:<15} | {pcrel:<11} | {secseg:<23} | {symbol}"
f_title = "|{address:<12} | {size:<4} | {type:<15} | {pcrel:<11} | {secseg:<23} | {symbol}"
print(f_title.format(
address="Address",
size="Size",
type="Type",
pcrel="PC Relative",
secseg="Section/Section",
symbol="Symbol"))
for reloc in binary.relocations:
type_str = ""
if reloc.origin == lief.MachO.RELOCATION_ORIGINS.DYLDINFO:
type_str = str(lief.MachO.REBASE_TYPES(reloc.type)).split(".")[-1]
if reloc.origin == lief.MachO.RELOCATION_ORIGINS.RELOC_TABLE:
if reloc.architecture == MachO.CPU_TYPES.x86:
type_str = str(MachO.X86_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.x86_64:
type_str = str(MachO.X86_64_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.ARM:
type_str = str(MachO.ARM_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.ARM64:
type_str = str(MachO.ARM64_RELOCATION(reloc.type))
if reloc.architecture == MachO.CPU_TYPES.POWERPC:
type_str = str(MachO.PPC_RELOCATION(reloc.type))
type_str = type_str.split(".")[-1]
symbol_name = ""
if reloc.has_symbol:
symbol_name = reloc.symbol.name
secseg_name = ""
if reloc.has_segment and reloc.has_section:
secseg_name = "{}.{}".format(reloc.segment.name, reloc.section.name)
else:
if reloc.has_segment:
secseg_name = reloc.segment.name
if reloc.has_section:
secseg_name = reloc.section.name
print(f_value.format(
address=reloc.address,
size=reloc.size,
type=type_str,
pcrel=str(reloc.pc_relative),
secseg=secseg_name,
symbol=symbol_name))
print("")
def main():
parser = argparse.ArgumentParser(usage='%(prog)s [options] <macho-file>')
parser.add_argument('-a', '--all',
action='store_true', dest='show_all',
help='Show all information')
parser.add_argument('-c', '--commands',
action='store_true', dest='show_commands',
help='Display Commands')
parser.add_argument('-H', '--header',
action='store_true', dest='show_header',
help='Display header')
parser.add_argument('-L', '--libraries',
action='store_true', dest='show_libraries',
help='Display Imported Libraries')
parser.add_argument('-l', '--segments',
action='store_true', dest='show_segments',
help='Display Segments')
parser.add_argument('-r', '--relocations',
action='store_true', dest='show_relocs',
help='Display the relocations (if present)')
parser.add_argument('-s', '--symbols',
action='store_true', dest='show_symbols',
help='Display Symbols')
parser.add_argument('-S', '--sections',
action='store_true', dest='show_sections',
help='Display Sections')
parser.add_argument('--uuid',
action='store_true', dest='show_uuid',
help='Display the UUID command')
parser.add_argument('--main',
action='store_true', dest='show_main',
help='Display the Main command')
parser.add_argument('--dylinker',
action='store_true', dest='show_dylinker',
help='Display the Dylinker command')
parser.add_argument('--dyldinfo',
action='store_true', dest='show_dyldinfo',
help='Display the DyldInfo command')
parser.add_argument('--function-starts',
action='store_true', dest='show_function_starts',
help='Display the FunctionStarts command')
parser.add_argument('--source-version',
action='store_true', dest='show_source_version',
help="Display the 'Source Version' command")
parser.add_argument('--version-min',
action='store_true', dest='show_version_min',
help="Display the 'Version Min' command")
parser.add_argument('--thread-command',
action='store_true', dest='show_thread_command',
help="Display the 'Thread Command' command")
parser.add_argument('--rpath-command',
action='store_true', dest='show_rpath_command',
help="Display the 'Rpath Command' command")
parser.add_argument("binary",
metavar="<macho-file>",
help='Target Mach-O File')
args = parser.parse_args()
binaries = None
try:
binaries = MachO.parse(args.binary)
except lief.exception as e:
print(e)
sys.exit(1)
for binary in binaries:
print_information(binary)
if args.show_header or args.show_all:
print_header(binary)
if args.show_commands or args.show_all:
print_commands(binary)
if args.show_libraries or args.show_all:
print_libraries(binary)
if args.show_segments or args.show_all:
print_segments(binary)
if args.show_sections or args.show_all:
print_sections(binary)
if args.show_symbols or args.show_all:
print_symbols(binary)
if (args.show_uuid or args.show_all) and binary.has_uuid:
print_uuid(binary)
if (args.show_main or args.show_all) and binary.has_main_command:
print_main_command(binary)
if (args.show_dylinker or args.show_all) and binary.has_dylinker:
print_dylinker(binary)
if (args.show_dyldinfo or args.show_all) and binary.has_dyld_info:
print_dyld_info(binary)
if (args.show_function_starts or args.show_all) and binary.has_function_starts:
print_function_starts(binary)
if (args.show_source_version or args.show_all) and binary.has_source_version:
print_source_version(binary)
if (args.show_version_min or args.show_all) and binary.has_version_min:
print_version_min(binary)
if (args.show_relocs or args.show_all) and len(binary.relocations) > 0:
print_relocations(binary)
if (args.show_thread_command or args.show_all) and binary.has_thread_command:
print_thread_command(binary)
if (args.show_rpath_command or args.show_all) and binary.has_rpath:
print_rpath_command(binary)
if __name__ == "__main__":
main()