#!/usr/bin/env python3 import lief import uuid import argparse import subprocess import os import sys import mmap import plistlib import json import sys import treelib import ctypes import stat import struct import threading import time ### --- I. MACH-O --- ### class MachOProcessor: def __init__(self, file_path): '''This class contains part of the code from the main() for the SnakeI: Mach-O part.''' self.file_path = os.path.abspath(file_path) def parseFatBinary(self): '''Return Fat Binary object.''' return lief.MachO.parse(self.file_path) def process(self, args): '''Executes the code for the SnakeI: Mach-O.''' if not os.path.exists(self.file_path): # Check if file_path specified in the --path argument exists. print(f'The file {self.file_path} does not exist.') exit() global binaries # It must be global, becuase after the MachOProcessor object is destructed, the snake_instance would point to invalid memory ("binary" is dependant on "binaries"). global snake_instance # Must be global for further processors classes. binaries = self.parseFatBinary() if binaries is None: exit() # Exit if the file is not valid macho snake_instance = SnakeVI(binaries, self.file_path) # Initialize the latest Snake class if args.file_type: # Print binary file type print(f'File type: {snake_instance.getFileType()}') if args.header_flags: # Print binary header flags header_flag_list = snake_instance.getHeaderFlags() print("Header flags:", " ".join(header_flag.__name__ for header_flag in header_flag_list)) if args.endian: # Print binary endianess print(f'Endianess: {snake_instance.getEndianess()}') if args.header: # Print binary header print(snake_instance.getBinaryHeader()) if args.load_commands: # Print binary load commands load_commands_list = snake_instance.getLoadCommands() print("Load Commands:", " ".join(load_command.command.__name__ for load_command in load_commands_list)) if args.has_cmd: # Check if LC exist snake_instance.printHasLoadCommand(args.has_cmd) if args.segments: # Print binary segments in human friendly form for segment in snake_instance.getSegments(): print(segment) if args.has_segment: # Check if binary has given __SEGMENT snake_instance.printHasSegment(args.has_segment) if args.sections: # Print binary sections in human friendly form for section in snake_instance.getSections(): print(section) if args.has_section: # Check if binary has given __SEGMENT,__section snake_instance.printHasSection(args.has_section) if args.symbols: # Print symbols for symbol in snake_instance.getSymbols(): print(f"0x{symbol.value:016X} {symbol.name}") if args.imports: # Print imported symbols snake_instance.printImports() if args.exports: # Print exported symbols snake_instance.printExports() if args.imported_symbols: snake_instance.printImportedSymbols() if args.chained_fixups: # Print Chained Fixups information print(snake_instance.getChainedFixups()) if args.exports_trie: # Print Exports Trie information print(snake_instance.getExportTrie()) if args.uuid: # Print UUID print(f'UUID: {snake_instance.getUUID()}') if args.main: # Print entry point and stack size snake_instance.printMain() if args.encryption_info is not None: # Print encryption info and save encrypted data if path is specified snake_instance.printEncryptionInfo(args.encryption_info) if args.strings_section: # Print strings from __cstring section print('Strings from __cstring section:') print('-------------------------------') for string in (snake_instance.getStringSection()): print(string) if args.all_strings: # Print strings from all sections. print(snake_instance.findAllStringsInBinary()) if args.save_strings: # Parse all sections, detect strings and save them to a file extracted_strings = snake_instance.findAllStringsInBinary() with open(args.save_strings, 'a') as f: for s in extracted_strings: f.write(s) if args.info: # Print all info about the binary print('\n<=== HEADER ===>') print(snake_instance.getBinaryHeader()) print('\n<=== LOAD COMMANDS ===>') for lcd in snake_instance.getLoadCommands(): print(lcd) print("="*50) print('\n<=== SEGMENTS ===>') for segment in snake_instance.getSegments(): print(segment) print('\n<=== SECTIONS ===>') for section in snake_instance.getSections(): print(section) print('\n<=== SYMBOLS ===>') for symbol in snake_instance.getSymbols(): print(f"{(symbol.name).ljust(32)} {hex(symbol.value)}") print('\n<=== STRINGS ===>') print('Strings from __cstring section:') print('-------------------------------') for string in (snake_instance.getStringSection()): print(string) if snake_instance.binary.has_encryption_info: print('\n<=== ENCRYPTION INFO ===>') snake_instance.printEncryptionInfo() print('\n<=== UUID ===>') print(f'{snake_instance.getUUID()}') print('\n<=== ENDIANESS ===>') print(snake_instance.getEndianess()) print('\n<=== ENTRYPOINT ===>') snake_instance.printMain() if args.dump_data: # Dump {size} bytes starting from {offset} to a given {filename}. snake_instance.dumpDataArgParser(args.dump_data) if args.calc_offset: # Calculate the real address of the Virtual Memory in the file. snake_instance.printCalcRealAddressFromVM(args.calc_offset) if args.constructors: # Print constructors snake_instance.printConstructors() class SnakeI: def __init__(self, binaries, file_path): ''' When initiated, the program parses a Universal binary (binaries parameter) and extracts the ARM64 Mach-O. If the file is not in a universal format but is a valid ARM64 Mach-O, it is taken as a binary parameter during initialization. ''' self.binary = self.parseFatBinary(binaries) self.file_path = file_path self.segments_count, self.file_start, self.file_size, self.file_end = self.getSegmentsInfo() self.load_commands = self.getLoadCommands() self.endianess = self.getEndianess() self.format_specifier = 'I' # For struct.pack self.reversed_format_specifier = '>I' if self.getEndianess() == 'little' else ' file_size: raise ValueError("Offset and size exceed the binary file's length.") # Seek to the offset considering the fat_offset file.seek(offset) # Read the specified size of bytes extracted_bytes = file.read(size) return extracted_bytes def saveBytesToFile(self, data, filename): ''' Save bytes to a file. ''' with open(filename, 'wb') as file: file.write(data) def readBytesFromFile(self, filename): ''' Read bytes from a file. ''' with open(filename, 'rb') as file: data = file.read() return data def dumpData(self, offset, size, filename): ''' Extract {size} bytes starting from {offset} to a given {filename}. ''' extracted_bytes = self.extractBytesAtOffset(offset, size) if extracted_bytes: self.saveBytesToFile(extracted_bytes, filename) def dumpDataArgParser(self, args): ''' Parse comma separated values for dumpData from --dump_data 'offset,size,filename'. ''' offset, size, filename = args.split(',') offset = offset.strip().lower() if offset.startswith("0x"): offset = int(offset, 16) size = size.strip().lower() if size.startswith("0x"): size = int(size, 16) filename = filename.strip() self.dumpData(offset, size, filename) def saveEcryptedData(self, output_path): '''Method for saving encrypted data sector to specified file.''' _, cryptoff, cryptsize = self.getEncryptionInfo() self.saveBytesToFile(self.extractBytesAtOffset(cryptoff + self.fat_offset, cryptsize), output_path) def hasSection(self, segment_section): ''' Takes "__SEGMENT,__section" as an input. Return True if it exists. ''' segment_section = segment_section.lower() for section in self.binary.sections: current_segment_section = f'{section.segment_name},{section.name}'.lower() if current_segment_section == segment_section: return True return False def printHasSection(self, segment_section): ''' Printing function for --has_section. ''' if self.hasSection(segment_section): print(f'{self.file_path} has {segment_section}') def extractSection(self, segment_name, section_name): ''' As argument takes segment name (e.g. "__PRELINK_INFO") and section name that is a part of the segment (e.g. '__text'). Return data (bytes) stored in a given section. If section was not found or is empty -> return False. ''' segment_section = f'{segment_name},{section_name}' if not self.hasSection(segment_section): # If section was not found, break. return False section_offset_start, section_offset_end = self.getSectionRange(segment_name, section_name) if section_offset_start and section_offset_end: size = section_offset_end - section_offset_start extracted_bytes = self.extractBytesAtOffset(section_offset_start, size) return extracted_bytes return False def dumpSection(self, segment_name, section_name, filename): ''' Dump '__SEGMENT,__section' to a given file. Reutrn False if the section does not exist. ''' extracted_bytes = self.extractSection(segment_name, section_name) if extracted_bytes: self.saveBytesToFile(extracted_bytes, filename) return True return False def hasLoadCommand(self, load_command): ''' Check if the given Load Command exists in the binary. ''' if load_command.startswith("LC_"): load_command = load_command[3:] load_command = load_command.lower() for cmd in self.load_commands: cmd = str(cmd.command.__name__).lower() if load_command == cmd: return True return False def printHasLoadCommand(self, load_command): ''' Printing function for has_cmd. ''' original_user_input = load_command if self.hasLoadCommand(load_command): print(f'{self.file_path} has {original_user_input}') def getVirtualMemoryStartingAddress(self): ''' Get start VM base addr of the __TEXT segment ''' vm_base = 0 if self.hasSegment('__TEXT'): for segment in self.binary.segments: if segment.name == '__TEXT': vm_base = segment.virtual_address return vm_base def calcRealAddressFromVM(self, vm_offset): ''' Calculate the real address of the Virtual Memory in the file. vm_start == __TEXT segment vm_offset == your address real = vm_offset - vm_start ''' # Handling strings and hexes if type(vm_offset) is not int: if (vm_offset.lower()).startswith("0x"): vm_offset = int(vm_offset, 16) else: vm_offset = int(vm_offset) vm_base = self.getVirtualMemoryStartingAddress() vm_offset = vm_offset - vm_base return vm_offset def printCalcRealAddressFromVM(self, vm_offset): ''' Printing function for --calc_offset ''' real_offset = self.calcRealAddressFromVM(vm_offset) real_offset_hex = hex(real_offset) print(f'{vm_offset} : {real_offset_hex}') def printConstructors(self): ''' Print all constructors functions from the binary. ''' for ctor in self.binary.ctor_functions: print(ctor) ### --- II. CODE SIGNING --- ### class CodeSigningProcessor: def __init__(self): '''This class contains part of the code from the main() for the SnakeII: Code Signing.''' pass def process(self, args): if args.verify_signature: # Verify if Code Signature match the binary content () if snake_instance.isSigValid(snake_instance.file_path): print("Valid Code Signature (matches the content)") else: print("Invalid Code Signature (does not match the content)") if args.cd_info: # Print Code Signature information print(snake_instance.getCodeSignature(snake_instance.file_path).decode('utf-8')) if args.cd_requirements: # Print Requirements. print(snake_instance.getCodeSignatureRequirements(snake_instance.file_path).decode('utf-8')) if args.entitlements: # Print Entitlements. print(snake_instance.getEntitlementsFromCodeSignature(snake_instance.file_path, args.entitlements)) if args.extract_cms: # Extract the CMS Signature and save it to a given file. cms_signature = snake_instance.extractCMS() snake_instance.saveBytesToFile(cms_signature, args.extract_cms) if args.extract_certificates: # Extract Certificates and save them to a given file. snake_instance.extractCertificatesFromCodeSignature(args.extract_certificates) if args.remove_sig: # Save a new file on a disk with the removed signature: snake_instance.removeCodeSignature(args.remove_sig) if args.sign_binary: # Sign the given binary using specified identity: snake_instance.signBinary(args.sign_binary) if args.cs_offset: # Print Code Signature offset snake_instance.printCodeSignatureOffset() if args.cs_flags: # Print Code Signature flags snake_instance.printCodeSignatureFlags() class SnakeII(SnakeI): def __init__(self, binaries, file_path): super().__init__(binaries, file_path) self.magic_bytes = (0xFADE0B01).to_bytes(4, byteorder='big') # CMS Signature Blob magic bytes, as Code Signature as a whole is in network byte order(big endian). def isSigValid(self, file_path): '''Checks if the Code Signature is valid (if the contents of the binary have been modified.)''' result = subprocess.run(["codesign", "-v", file_path], capture_output=True) if result.stderr == b'': return True else: return False def getCodeSignature(self, file_path): '''Returns information about the Code Signature.''' result = subprocess.run(["codesign", "-d", "-vvvvvv", file_path], capture_output=True) return result.stderr def getCodeSignatureRequirements(self, file_path): '''Returns information about the Code Signature Requirements.''' result = subprocess.run(["codesign", "-d", "-r", "-", file_path], capture_output=True) return result.stdout def getEntitlementsFromCodeSignature(self, file_path, format=None): '''Returns information about the Entitlements for Code Signature.''' if format == 'human' or format == None: result = subprocess.run(["codesign", "-d", "--entitlements", "-", file_path], capture_output=True) return result.stdout.decode('utf-8') elif format == 'xml': result = subprocess.run(["codesign", "-d", "--entitlements", "-", "--xml", file_path], capture_output=True) elif format == 'der': result = subprocess.run(["codesign", "-d", "--entitlements", "-", "--der", file_path], capture_output=True) return result.stdout def extractCMS(self): '''Find the offset of magic bytes in a binary using LIEF.''' cs = self.binary.code_signature cs_content = bytes(cs.content) offset = cs_content.find(self.magic_bytes) cms_len_in_bytes = cs_content[offset + 4:offset + 8] cms_len_in_int = int.from_bytes(cms_len_in_bytes, byteorder='big') cms_signature = cs_content[offset + 8:offset + 8 + cms_len_in_int] return cms_signature def extractCertificatesFromCodeSignature(self, cert_name): '''Extracts certificates from the CMS Signature and saves them to a file with _0, _1, _2 indexes at the end of the file names.''' subprocess.run(["codesign", "-d", f"--extract-certificates={cert_name}_", self.file_path], capture_output=True) def removeCodeSignature(self, new_name): '''Save new file on a disk with removed signature.''' self.binary.remove_signature() self.binary.write(new_name) def signBinary(self, security_identity=None): '''Sign binary using pseudo identity (adhoc) or specified identity.''' if security_identity == 'adhoc' or security_identity == None: result = subprocess.run(["codesign", "-s", "-", "-f", self.file_path], capture_output=True) return result.stdout.decode('utf-8') else: try: result = subprocess.run(["codesign", "-s", security_identity, "-f", self.file_path], capture_output=True) except Exception as e: print(f"An error occurred during Code Signing using {security_identity}\n {e}") def getCodeSignatureOffset(self): ''' Return the file offset of the Code Signature. Takes into account Fat binaries. ''' return self.binary.code_signature.data_offset + self.fat_offset def printCodeSignatureOffset(self): print(f'Code Signature offset: {hex(self.getCodeSignatureOffset())}') def getCodeSignatureSize(self): ''' Return Code Signature size. ''' return self.binary.code_signature.data_size def extractCodeSignatureBytes(self): ''' Extract the content of the Code Signature as raw bytes. Takes into account Fat binaries. ''' #The self.binary.code_signature.content.tobytes() takes into account Fat binaries, so no need to calculate the offset of valid signature manually. #cs_offset = self.getCodeSignatureOffset() #cs_size = self.getCodeSignatureSize() #cs_bytes = self.extractBytesAtOffset(cs_offset, cs_size) #self.saveBytesToFile(cs_bytes, 'test.bin') cs_bytes = self.binary.code_signature.content.tobytes() return cs_bytes def findBytes(self, magic, bytes): ''' Find [magic] bytes in a given [bytes]. ''' offset = bytes.find(magic) return offset def parseCodeDirectoryBlob(self): ''' Parse Code Directory blob from Code Signature to extract its version and then use AppleStructuresManager to parse the whole structure according to its version. ''' # Extracting version number CS_MAGIC_CODEDIRECTORY = 0xFADE0C02 cs_magic_codedirectory_as_bytes = struct.pack(self.reversed_format_specifier, CS_MAGIC_CODEDIRECTORY) cs_blob = self.extractCodeSignatureBytes() cs_directory_offset = self.findBytes(cs_magic_codedirectory_as_bytes, cs_blob) version_offset = cs_directory_offset + 8 version_bytes = cs_blob[version_offset:version_offset+4] version = struct.unpack(self.reversed_format_specifier, version_bytes)[0] # Extracting size size_offset = version_offset - 4 size_bytes = cs_blob[size_offset:size_offset+4] size = struct.unpack(self.reversed_format_specifier, size_bytes)[0] # Parsing __CodeDirectory code_directory_struct_instance = AppleStructuresManager.CodeDirectory(version) code_directory_dict = code_directory_struct_instance.parse(cs_blob[cs_directory_offset:size]) return code_directory_dict def getCodeSignatureFlags(self): ''' Extract CS flags: https://github.com/apple-oss-distributions/xnu/blob/1031c584a5e37aff177559b9f69dbd3c8c3fd30a/osfmk/kern/cs_blobs.h#L35''' code_directory_dict = self.parseCodeDirectoryBlob() return code_directory_dict['flags'] def printCodeSignatureFlags(self): print(f'CS_FLAGS: {hex(self.getCodeSignatureFlags())}') ### --- III. CHECKSEC --- ### class ChecksecProcessor: def __init__(self): '''This class contains part of the code from the main() for the SnakeIII: Checksec.''' pass def process(self, args): if args.has_pie: # Check if PIE is set in the header flags print("PIE: " + str(snake_instance.hasPIE())) if args.has_arc: # Check if ARC is in use print("ARC: " + str(snake_instance.hasARC())) if args.is_stripped: # Check if binary is stripped print("STRIPPED: " + str(snake_instance.isStripped())) if args.has_canary: # Check if binary has stack canary print("CANARY: " + str(snake_instance.hasCanary())) if args.has_nx_stack: # Check if binary has non executable stack print("NX STACK: " + str(snake_instance.hasNXstack())) if args.has_nx_heap: # Check if binary has non executable heap print("NX HEAP: " + str(snake_instance.hasNXheap())) if args.has_xn: # Check if binary is protected by eXecute Never functionality print(f"eXecute Never: {str(snake_instance.hasXN())}") if args.is_notarized: # Check if the application is notarized and can pass the Gatekeeper verification print("NOTARIZED: " + str(snake_instance.isNotarized(snake_instance.file_path))) if args.is_encrypted: # Check if the application has encrypted data print("ENCRYPTED: " + str(snake_instance.isEncrypted())) if args.is_restricted: # Check if the application has encrypted data print("RESTRICTED: " + str(snake_instance.isRestricted(snake_instance.file_path))) if args.is_hr: # Check if Hardened Runtime is in use print("HARDENED: " + str(snake_instance.hasHardenedRuntimeFlag(snake_instance.file_path))) if args.is_as: # Check if App Sandbox is in use print("APP SANDBOX: " + str(snake_instance.hasAppSandbox(snake_instance.file_path))) if args.is_fort: # Check if binary is fortified fortified_symbols = snake_instance.getForifiedSymbols() print("FORTIFIED: " + str(snake_instance.isFortified(fortified_symbols))) if args.has_rpath: # Check if binary has @rpaths print("RPATH: " + str(snake_instance.hasRpath())) if args.has_lv: # Check if binary is protected against Dylib Hijacking print("LIBRARY VALIDATION: " + str(snake_instance.checkDylibHijackingProtections(snake_instance.file_path))) if args.checksec: # Run all checks from above and present it in a table print("<==== CHECKSEC ======") print("PIE: ".ljust(16) + str(snake_instance.hasPIE())) print("ARC: ".ljust(16) + str(snake_instance.hasARC())) print("STRIPPED: ".ljust(16) + str(snake_instance.isStripped())) print("CANARY: ".ljust(16) + str(snake_instance.hasCanary())) print("NX STACK: ".ljust(16) + str(snake_instance.hasNXstack())) print("NX HEAP: ".ljust(16) + str(snake_instance.hasNXheap())) print("XN:".ljust(16) + str(snake_instance.hasXN())) print("NOTARIZED: ".ljust(16) + str(snake_instance.isNotarized(snake_instance.file_path))) print("ENCRYPTED: ".ljust(16) + str(snake_instance.isEncrypted())) print("RESTRICTED: ".ljust(16) + str(snake_instance.isRestricted(snake_instance.file_path))) print("HARDENED: ".ljust(16) + str(snake_instance.hasHardenedRuntimeFlag(snake_instance.file_path))) print("APP SANDBOX: ".ljust(16) + str(snake_instance.hasAppSandbox(snake_instance.file_path))) fortified_symbols = snake_instance.getForifiedSymbols() print("FORTIFIED: ".ljust(16) + str(snake_instance.isFortified(fortified_symbols))) print("RPATH: ".ljust(16) + str(snake_instance.hasRpath())) print("LV: ".ljust(16) + str(snake_instance.checkDylibHijackingProtections(snake_instance.file_path))) print("=====================>") class SnakeIII(SnakeII): def __init__(self, binaries, file_path): super().__init__(binaries, file_path) def hasPIE(self): '''Check if MH_PIE (0x00200000) is set in the header flags.''' return self.binary.is_pie def hasARC(self): '''Check if the _objc_release symbol is imported.''' for symbol in self.binary.symbols: if symbol.name.lower().strip() == '_objc_release': return True return False def isStripped(self): '''Check if binary is stripped.''' filter_symbols = ['radr://5614542', '__mh_execute_header'] for symbol in self.binary.symbols: symbol_type = symbol.type symbol_name = symbol.name.lower().strip() is_symbol_stripped = (symbol_type & 0xe0 > 0) or (symbol_type in [0x0e, 0x1e, 0x0f]) is_filtered = symbol_name not in filter_symbols if is_symbol_stripped and is_filtered: return False return True def hasCanary(self): '''Check whether in the binary there are symbols: ___stack_chk_fail and ___stack_chk_guard.''' canary_symbols = ['___stack_chk_fail', '___stack_chk_guard'] for symbol in self.binary.symbols: if symbol.name.lower().strip() in canary_symbols: return True return False def hasNXstack(self): '''Check if MH_ALLOW_STACK_EXECUTION (0x00020000 ) is not set in the header flags.''' return not bool(self.binary.header.flags & lief.MachO.HEADER_FLAGS.ALLOW_STACK_EXECUTION.value) def hasNXheap(self): '''Check if MH_NO_HEAP_EXECUTION (0x01000000 ) is set in the header flags.''' return bool(self.binary.header.flags & lief.MachO.HEADER_FLAGS.NO_HEAP_EXECUTION.value) def isXNos(): '''Check if the OS is running on the ARM architecture.''' system_info = os.uname() if "arm" in system_info.machine.lower(): return True return False def checkXNmap(): '''If XN is ON, you will not be able to map memory page that has W&X at the same time, so to check it, you can create such page.''' try: mmap.mmap(-1,4096, prot=mmap.PROT_READ | mmap.PROT_WRITE | mmap.PROT_EXEC) except mmap.error as e: #print(f"Failed to create W&X memory map - eXecute Never is supported on this machine. \n {str(e)}") return True return False def convertXMLEntitlementsToDict(self, entitlements_xml): '''Takes the Entitlements in XML format from getEntitlementsFromCodeSignature() method and convert them to a dictionary.''' return plistlib.loads(entitlements_xml) def convertDictEntitlementsToJson(self,entitlements_dict): '''Takes the Entitlements in dictionary format from convertXMLEntitlementsToDict() method and convert them to a JSON with indent 4.''' return json.dumps(entitlements_dict, indent=4) def checkIfEntitlementIsUsed(self, entitlement_name, entitlement_value, file_path): '''Check if the given entitlement exists and has the specified value.''' try: entitlements_xml = self.getEntitlementsFromCodeSignature(file_path, 'xml') if entitlements_xml == b'': # Return False if there are no entitlements return False entitlements_dict = self.convertXMLEntitlementsToDict(entitlements_xml) # Convert the entire parsed data to lowercase for case-insensitive comparison parsed_data = {key.lower(): value for key, value in entitlements_dict.items()} # Convert entitlement name and value to lowercase for case-insensitive and type-insensitive comparison entitlement_name_lower = entitlement_name.lower() entitlement_value_lower = str(entitlement_value).lower() if entitlement_name_lower in parsed_data and str(parsed_data[entitlement_name_lower]).lower() == entitlement_value_lower: return True else: return False except json.JSONDecodeError as e: # Handle JSON decoding error if any print(f"Error in checkIfEntitlementIsUsed: {e}") return False def hasAllowJITentitlement(self, file_path): '''Checks if the binary has missing com.apple.security.cs.allow-jit entitlement that allows the app to create writable and executable memory using the MAP_JIT flag.''' if self.checkIfEntitlementIsUsed('com.apple.security.cs.allow-jit', 'true', file_path): print(f"[INFO -> XN]: {os.path.basename(file_path)} contains allow-jit entitlement.") return True return False def checkIfCompiledForOtherThanARM(self): '''Iterates over FatBinary and check if there are other architectures than ARM.''' XN_types = [lief.MachO.CPU_TYPES.ARM64, lief.MachO.CPU_TYPES.ARM] for binary in binaries: if binary.header.cpu_type not in XN_types: print(f"[INFO -> XN]: {os.path.basename(file_path)} is compiled for other CPUs than ARM or ARM64.") return True return False def hasXN(self): '''Check if binary allows W&X via com.apple.security.cs.allow-jit entitlement or is compiled for other CPU types than these which supports eXecuteNever feature of ARM.''' if self.hasAllowJITentitlement(self.file_path) or self.checkIfCompiledForOtherThanARM(): return False return True def isNotarized(self, file_path): '''Verifies if the application is notarized and can pass the Gatekeeper verification.''' result = subprocess.run(["spctl", "-a", file_path], capture_output=True) if result.stderr == b'': return True else: #print(f"[INFO -> NOTARIZATION]: {result.stderr.decode().rstrip()}") return False def isEncrypted(self): '''If the cryptid has a non-zero value, some parts of the binary are encrypted.''' if self.binary.has_encryption_info: if self.binary.encryption_info.crypt_id == 1: return True return False def hasRestrictSegment(self): '''Check if binary contains __RESTRICT segment. Return True if it does.''' for segment in self.binary.segments: if segment.name.lower().strip() == "__restrict": return True return False def hasRestrictFlag(self, file_path): '''Check if Code Signature flag CS_RESTRICT 0x800(restrict) is set for the given binary''' if b'restrict' in self.getCodeSignature(file_path): return True return False def isRestricted(self, file_path): '''Check if binary has __RESTRICT segment or CS_RESTRICT flag set.''' if self.hasRestrictSegment() or self.hasRestrictFlag(file_path): return True return False def hasHardenedRuntimeFlag(self, file_path): '''Check if Hardened Runtime flag is set for the given binary.''' if b'runtime' in self.getCodeSignature(file_path): return True return False def hasAppSandbox(self, file_path): '''Check if App Sandbox is in use (com.apple.security.app-sandbox entitlement is set).''' if self.checkIfEntitlementIsUsed('com.apple.security.app-sandbox', 'true', file_path): return True return False def getForifiedSymbols(self): '''Check for symbol names that contain _chk suffix and filter out stack canary symbols. Function returns a list of all safe symbols.''' symbol_fiter = ['___stack_chk_fail', '___stack_chk_guard'] fortified_symbols = [] for symbol in self.binary.symbols: symbol_name = symbol.name.lower().strip() if ('_chk' in symbol_name) and (symbol_name not in symbol_fiter): fortified_symbols.append(symbol_name) return fortified_symbols def isFortified(self, fortified_symbols): '''Check if there are any fortified symbols in the give fortified_symbols list.''' if len(fortified_symbols) > 0: return True return False def hasRpath(self): return self.binary.has_rpath ### --- IV. DYLIBS --- ### class DylibsProcessor: def __init__(self): '''This class contains part of the code from the main() for the SnakeIV: Dylibs.''' pass def process(self, args): if args.dylibs: # Shared dylibs with unresolved paths snake_instance.printDylibs() if args.rpaths: # All resolved paths from LC_RPATHs snake_instance.printRpathsResolved() if args.rpaths_u: # All inresolved paths from LC_RPATHs snake_instance.printRpathsUnresolved() if args.dylibs_paths: # Resolved dylib loading paths in order they are searched for snake_instance.printResolvedDylibPaths() if args.dylibs_paths_u: # Unresolved dylib loading paths (same as --dylibs, but without version info) snake_instance.printUnresolvedDylibPaths() if args.broken_relative_paths: # Relative paths snake_instance.printBrokenRelativePaths() if args.dylibtree: # Dylibtree args_dylibtree = args.dylibtree.split(',') dylibtree = snake_instance.getDylibTree(args_dylibtree[0], args_dylibtree[1],args_dylibtree[2]) snake_instance.printTreeFromTreelib(dylibtree) if args.dylib_id: # Path from Dylib ID Load Command print(snake_instance.getPathFromDylibID()) if args.reexport_paths: # All reexported libraries paths print(*snake_instance.getReExportPaths(), sep="\n") if args.hijack_sec: # Check Dylib Hijacking protection on binary print("DYLIB HIJACKIG PROTECTION: " + str(snake_instance.checkDylibHijackingProtections(snake_instance.file_path))) if args.dylib_hijacking: # Direct & Indirect Dylib Hijacking check if args.dylib_hijacking == 'default': args.dylib_hijacking = None all_results = snake_instance.dylibHijackingScanner(args.dylib_hijacking) snake_instance.parseDylibHijackingScannerResults(all_results) if args.dylib_hijacking_a: # Show only possible vectors if args.dylib_hijacking_a == 'default': args.dylib_hijacking_a = None all_results = snake_instance.dylibHijackingScanner(args.dylib_hijacking_a) dh_check = snake_instance.isVulnDylibHijacking(all_results) if dh_check: print(dh_check) if args.prepare_dylib is not None: # Compile rogue dylib snake_instance.prepareRogueDylib(args.prepare_dylib) class SnakeIV(SnakeIII): def __init__(self, binaries, file_path): ''' When initiated, it run series of commands to extract: - all load commands - dylib loading commands - dylib ID (if exists) - rpaths (resolved) - absolute paths (@executable_path|@loader_path|@rpath resolved) Sets default Dyld Shared Cache location ''' super().__init__(binaries, file_path) self.dylib_load_commands_names = { 'LAZY_LOAD_DYLIB', 'LOAD_DYLIB', 'LOAD_UPWARD_DYLIB', 'LOAD_WEAK_DYLIB', 'PREBOUND_DYLIB', 'REEXPORT_DYLIB', } self.dylib_id_path = self.getPathFromDylibID() # Get Dylib ID for @loader_path resolving self.dylib_loading_commands, self.dylib_loading_commands_names = self.getDylibLoadCommands() # 1. Get dylib specific load commands self.rpath_list = self.resolveRunPathLoadCommands() # 2. Get LC_RPATH list self.absolute_paths = self.resolveDylibPaths() # 3. Get all dylib absolute paths dictionary {dylib_name[dylib_paths]} self.dyld_share_cache_path = '/System/Volumes/Preboot/Cryptexes/OS/System/Library/dyld/dyld_shared_cache_arm64e' def getSharedLibraries(self, only_names=True): ''' Return array of shared libraries used by the binary. When the only_names is set to False it aslo prints compatibility and current version of each library. ''' dylibs = [] for library in self.binary.libraries: if only_names: dylibs.append(library.name) else: formatted_compat_version = ".".join(map(str, library.compatibility_version)) formatted_current_version = ".".join(map(str, library.current_version)) dylibs.append(f"{library.name} (compatibility version: {formatted_compat_version}, current version: {formatted_current_version})") return dylibs def getDylibLoadCommands(self): '''Return a list of load commands that load dylibs.''' dylib_loading_commands = [] dylib_loading_commands_names = [] for cmd in self.load_commands: cmd_name = cmd.command.__name__ if cmd_name in self.dylib_load_commands_names: dylib_loading_commands.append(cmd) dylib_loading_commands_names.append(cmd_name) return dylib_loading_commands, dylib_loading_commands_names def getUnresolvedRunPathLoadCommandsPaths(self): ''' Return a list of unresolved paths (like @executable_path/Frameworks) from LC_RPATH load commands. Example return: ['/usr/lib/swift', '@executable_path/Frameworks', '@loader_path/Frameworks'] ''' return [cmd.path for cmd in self.load_commands if cmd.command.__name__ == 'RPATH'] def resolveRunPathLoadCommands(self): ''' Return a list of resolved (absolute) paths from LC_RPATH. Example return: ['/usr/lib/swift', '/Applications/Suunto.app/WrappedBundle/Frameworks', '/Applications/Suunto.app/WrappedBundle/Frameworks'] ''' executable_path = os.path.dirname(self.file_path) if self.dylib_id_path: loader_path = self.dylib_id_path else: loader_path = executable_path unresolved_LC_RPATHS = self.getUnresolvedRunPathLoadCommandsPaths() LC_RPATHS = [] for path in unresolved_LC_RPATHS: if path.startswith('@executable_path'): path = path.replace('@executable_path',executable_path) LC_RPATHS.append(path) elif path.startswith('@loader_path'): path = path.replace('@loader_path',loader_path) LC_RPATHS.append(path) else: LC_RPATHS.append(path) return LC_RPATHS def extractPathFromDylibLoadCommandStruct(self, dylib_load_command): '''Extracts the string path from a dylib load command structure.''' cmd_data = bytes(dylib_load_command.data) offset_data = cmd_data[8:] offset = int.from_bytes(offset_data[:4], byteorder=self.endianess) string_data = cmd_data[offset:] null_index = string_data.find(0) path_bytes = string_data[:null_index] path_string = path_bytes.decode('utf-8') return path_string def resolveRunPathPaths(self, path): ''' Return ordered list of resolved @rpaths for the given dylib path. Example return for self.rpath_list = ['/1/', '/2/'] and dylib path = @rpath/test.dylib [ '/1/test.dylib', '/2/test.dylib'] ''' resolved_rpaths = [] for rpath in self.rpath_list: resolved_rpaths.append(path.replace('@rpath',rpath)) return resolved_rpaths def resolveDylibPaths(self): ''' Return a dictionary of dylib_name : dylib_absolute_paths Paths are absolute (with resolved @rpath, @executable_path, @loader_path) ''' executable_path = os.path.dirname(self.file_path) if self.dylib_id_path: loader_path = self.dylib_id_path else: loader_path = executable_path absolute_paths = {} for dylib_load_command in self.dylib_loading_commands: path = self.extractPathFromDylibLoadCommandStruct(dylib_load_command) name = os.path.basename(path) if name not in absolute_paths: absolute_paths[name] = [] if path.startswith('@executable_path'): path = path.replace('@executable_path', executable_path) absolute_paths[name].append(path) elif path.startswith('@rpath'): paths = self.resolveRunPathPaths(path) absolute_paths[name].extend(paths) elif path.startswith('@loader_path'): path = path.replace('@loader_path', loader_path) absolute_paths[name].append(path) else: absolute_paths[name].append(path) return absolute_paths def checkBrokenRelativeDylibSource(self): ''' Check for bad dylib source. When Dylib is relative, but does not use @executable_path | @loader_path | @rpath. For example: mylib.dylib instead of @executable_path/mylib.dylib ''' broken_relative_dylibs = [] for _, paths in self.absolute_paths.items(): # Iterate dylibs:paths dictionary for path in paths: if not path.startswith('/'): broken_relative_dylibs.append(path) return broken_relative_dylibs def checkIfPathExists(self, path): '''Check if specified path exists on the filesystem.''' return os.path.exists(path) def checkIfPathExistsInDyldSharedCache(self, path, extracted_dyld_share_cache_directory_path): '''Return if the path exists in the DSC - you must first extract it.''' path = os.path.abspath(extracted_dyld_share_cache_directory_path) + "/" + path return self.checkIfPathExists(path) def runDyldSharedCacheExtractor(self, dyld_share_cache_path, extracted_output_path): '''Run dyld-shared-cache-extractor command.''' command = ['dyld-shared-cache-extractor', dyld_share_cache_path, extracted_output_path] subprocess.run(command, check=True) def getDylibTree(self, dyld_share_cache_path=None, extracted_output_path=None, is_extracted=0): ''' A function that inspects the dynamic dependencies of a Mach-O binary recursively (like recursive otool -L). You must use absolute path in --path if you are using --dylibtree from extracted Dyld Shared Cache. ''' if dyld_share_cache_path in [None, '']: dyld_share_cache_path = self.dyld_share_cache_path if extracted_output_path in [None, '']: extracted_output_path = 'extracted_dyld_share_cache/' extracted_output_path = os.path.abspath(extracted_output_path) # Convert to absolute path if is_extracted == '0': self.runDyldSharedCacheExtractor(dyld_share_cache_path, extracted_output_path) dylibtree = treelib.Tree() path_to_process = [self.file_path] already_checked_paths = [] not_existing_paths = [] # It could be the already_checked_paths for optimization, but for code clarity it stay. node_id = 0 dylibtree.create_node(self.file_path, node_id) while path_to_process: current_path = path_to_process.pop() if (current_path not in path_to_process) and (current_path not in already_checked_paths) and (current_path not in not_existing_paths): fat_binary = lief.MachO.parse(current_path) dylib_snake_instance = SnakeIV(fat_binary, current_path) if current_path.startswith(extracted_output_path): current_path = current_path.removeprefix(extracted_output_path) for _, dylib_paths in dylib_snake_instance.absolute_paths.items(): for path in dylib_paths: # All dylibs for current binary (current_path from existing_path_to_process) absolute_path = os.path.abspath(path) node_id += 1 filtered_nodes = list(dylibtree.filter_nodes(lambda node: node.tag == current_path)) nid_of_first_occurance_of_dylib_in_dylibtree = filtered_nodes[0].identifier # If path exist on the filesystem or DSC, add as a leaf to tree ## current_path(root) -> absolute_path(leaf) if absolute_path not in path_to_process: if dylib_snake_instance.checkIfPathExists(absolute_path): path_to_process.append(absolute_path) # Add this path to process recursively in while loop dylibtree.create_node(absolute_path, node_id, parent=nid_of_first_occurance_of_dylib_in_dylibtree) # Add a path as a leaf elif dylib_snake_instance.checkIfPathExistsInDyldSharedCache(path, extracted_output_path): dsc_path = extracted_output_path + path path_to_process.append(dsc_path) dylibtree.create_node(absolute_path, node_id, data='\033[94mDSC\033[0m', parent=nid_of_first_occurance_of_dylib_in_dylibtree) # Add a path as a leaf else: not_existing_paths.append(absolute_path) dylibtree.create_node(absolute_path, node_id, data='\033[91mWARNING - not existing path\033[0m', parent=nid_of_first_occurance_of_dylib_in_dylibtree) # If the node path (current_path) was checked, it should not be unwind again. already_checked_paths.append(current_path) already_checked_paths.append(extracted_output_path + current_path) return dylibtree def getDylibID(self): ''' Return a LC_ID_DYLIB Load Command if exists. Dyld additionally check if the FILE TYPE == MH_DYLIB. I intentionally omit this step to always extract ID. ''' for cmd in self.load_commands: if cmd.command.__name__ == 'ID_DYLIB': return cmd return None def getPathFromDylibID(self): '''Return a path stored inside the Dylib ID Load Command.''' dylib_id_lc = self.getDylibID() if dylib_id_lc: return self.extractPathFromDylibLoadCommandStruct(dylib_id_lc) return None def printTreeFromTreelib(self, tree): ''' Helper function for printing the dylibtree. It will only work with this structure because the root id is equal to 0 (tree.get_node(0)), which is not always true. I had to write this to make pretty printing with data work because, by default, tree limb does not support printing with data. Data is needed to show warnings if any library is missing on the filesystem and to inform if the library was from Dyld Share Cachce. ''' def recursivePrint(node, prefix="", last=True): data_str = f": {node.data}" if node.data else "" print(f"{prefix}{'`-- ' if last else '|-- '}{node.tag}{data_str}") children = tree.children(node.identifier) count = len(children) for i, child in enumerate(children): is_last = i == count - 1 child_prefix = f"{prefix}{' ' if last else '| '}" recursivePrint(child, child_prefix, is_last) root = tree.get_node(0) recursivePrint(root) def printDylibs(self): dylibs = self.getSharedLibraries(only_names=False) if dylibs: print(f"{self.file_path} depends on libraries:") for d in dylibs: print(f"\t{d}") else: print(f"{self.file_path} does not depend on any libraries.") def printRpathsResolved(self): '''Print all paths that @rpath can be resolved to.''' print(*self.rpath_list, sep="\n") def printRpathsUnresolved(self): print(*self.getUnresolvedRunPathLoadCommandsPaths(), sep="\n") def printResolvedDylibPaths(self): '''Prints all resolved (absolute) dylib loading commands paths.''' for _, dylib_paths in self.absolute_paths.items(): print(*dylib_paths, sep='\n') def printUnresolvedDylibPaths(self): '''Prints all unresolved (with @rpath|@executable_path|@loader_path) dylib loading commands paths.''' for dylib_load_command in self.dylib_loading_commands: print(self.extractPathFromDylibLoadCommandStruct(dylib_load_command)) def printBrokenRelativePaths(self): '''Print 'broken' relative paths from the binary (cases where the dylib source is specified for an executable directory without @executable_path)''' for broken_path in self.checkBrokenRelativeDylibSource(): print(broken_path) def getMissingPaths(self): '''Return two unique lists of missing and existing paths.''' missing_paths = [] existing_paths = [] for _, paths in self.absolute_paths.items(): for path in paths: if os.path.exists(path): existing_paths.append(path) break # Stop checking further paths for this dylib else: missing_paths.append(path) unique_missing = list(set(missing_paths)) unique_existing = list(set(existing_paths)) return unique_missing, unique_existing def checkWriteAccessMissing(self, paths): ''' Check write access for the given paths. In case the directory does not exists, traverse back till directory that exists and check write access there. Return a list of writeable directories. ''' write_accessible_paths = [] for path in paths: current_path = path if os.access(current_path, os.W_OK): write_accessible_paths.append(path) continue while current_path: current_path = os.path.dirname(current_path) if not os.path.exists(current_path): continue if os.access(current_path, os.W_OK): write_accessible_paths.append(path) break else: break return write_accessible_paths def checkWriteAccessExisting(self, paths): '''Return a list of write-accessible paths.''' write_accessible_paths = [] for path in paths: if os.access(path, os.W_OK): write_accessible_paths.append(path) return write_accessible_paths def hasLibraryValidationFlag(self, file_path): '''Check Library validation flag for given binary.''' if b'library-validation' in self.getCodeSignature(file_path): return True return False def hasDisableLibraryValidationEntitlement(self, file_path): ''' Checks if the binary has com.apple.security.cs.disable-library-validation or com.apple.private.security.clear-library-validation entitlement set. They allows loading dylibs without requiring code signing. ''' if self.checkIfEntitlementIsUsed('com.apple.security.cs.disable-library-validation', 'true', file_path) or self.checkIfEntitlementIsUsed('com.apple.private.security.clear-library-validation','true', file_path): return True return False def getDyldSharedCacheDylibsPaths(self, dsc_path): ''' Parse Dyld Shared Cache using ipsw to extract dylib paths. Ref: https://blacktop.github.io/ipsw/docs/guides/dyld/ ''' if dsc_path == None: dsc_path = self.dyld_share_cache_path command = f"ipsw dyld info {dsc_path} -l -j >> /tmp/dyld_shared_cache_temp_1234.json" subprocess.run(command, shell=True, check=True) with open('/tmp/dyld_shared_cache_temp_1234.json', 'r') as file: data = json.load(file) os.remove('/tmp/dyld_shared_cache_temp_1234.json') # jq -r '.dylibs[].name' dsc.json paths = [dylib['name'] for dylib in data.get('dylibs', [])] return paths def printDyldSharedCacheDylibsPaths(self, dsc_path): '''Print Dyld paths from Dyld Shared Cache.''' if dsc_path == None: dsc_path = self.dyld_share_cache_path paths = self.getDyldSharedCacheDylibsPaths(dsc_path) for path in paths: print(path) def checkDylibHijackingProtections(self, file_path): ''' Check protections against dylib hijacking. Return True if protected (has library validation ON). ''' # Check if 'com.apple.security.cs.disable-library-validation' or 'com.apple.private.security.clear-library-validation' entitlements are present and set to true - INSECURE. has_insecure_entitlement = self.hasDisableLibraryValidationEntitlement(file_path) # Check if Library validation or Hardened runtime is active - SECURE is_hardened_runtime_active = self.hasHardenedRuntimeFlag(file_path) is_library_validation_active = self.hasLibraryValidationFlag(file_path) if has_insecure_entitlement: # Entitlements disables protections return False elif is_hardened_runtime_active or is_library_validation_active: # If there are no entitlements and HR or LV exists, then protections is ON return True else: # If there are no insecure entitlements, but there are also no HR or LV, there are no protections return False def dylibHijackingScanner(self, dyld_share_cache_path): ''' Direct and Indirect Dylib Hijacking Scanner - return dictionary of results for main binary and each dependancy. Save JSON format to /tmp/dylib_hijacking_log.json. Return results dictionary. ''' if dyld_share_cache_path in [None, '']: dyld_share_cache_path = self.dyld_share_cache_path dsc_paths = self.getDyldSharedCacheDylibsPaths(dyld_share_cache_path) already_checked_paths = [] all_results = {} path_to_process = [self.file_path] while path_to_process: current_path = path_to_process.pop() result = { 'is_protected' : bool, 'writeable_missing_paths' : [], 'writeable_existing_paths' : [] } if (current_path not in already_checked_paths) and (current_path not in dsc_paths): fat_binary = lief.MachO.parse(current_path) dylib_snake_instance = SnakeIV(fat_binary, current_path) missing_paths, existing_paths = dylib_snake_instance.getMissingPaths() result['writeable_missing_paths'] = dylib_snake_instance.checkWriteAccessMissing(missing_paths) result['writeable_existing_paths'] = dylib_snake_instance.checkWriteAccessExisting(existing_paths) result['is_protected'] = dylib_snake_instance.checkDylibHijackingProtections(dylib_snake_instance.file_path) already_checked_paths.append(current_path) path_to_process.extend(existing_paths) all_results[current_path] = result json_file_path = '/tmp/dylib_hijacking_log.json' with open(json_file_path, 'a') as json_file: json.dump(all_results, json_file) return all_results def isVulnDylibHijacking(self, all_results): ''' Automatically decide if target is vulnerable to Dylib Hijacking. Returns vulnerability info or None if protected. ''' root_binary = True info = '' for current_path, result in all_results.items(): if root_binary and result['is_protected']: return # Root binary is protected - not vuln if not result['is_protected']: if result['writeable_existing_paths'] or result['writeable_missing_paths']: if root_binary: info += (f'\033[91mVULNERABLE ROOT BINARY\033[0m: {current_path}\n') root_binary = False else: info += (f'\033[91mVULNERABLE DEPENDENCY\033[0m: {current_path}\n') if result['writeable_existing_paths']: info += (f"\033[91mWRITEABLE EXISTING PATHS\033[0m: {', '.join(map(str, result['writeable_existing_paths']))}\n") if result['writeable_missing_paths']: info += (f"\033[91mWRITEABLE MISSING PATHS\033[0m: {', '.join(map(str, result['writeable_missing_paths']))}\n") if info: return info else: return def parseDylibHijackingScannerResults(self, all_results): ''' Print the dylibHijackingScanner results in a nice format. ''' first_iteration = True for current_path, result in all_results.items(): if first_iteration: if result['is_protected']: print(f"\033[92mROOT BINARY PROTECTED\033[0m: {current_path}") else: print(f"\033[91mROOT BINARY NOT PROTECTED\033[0m: {current_path}") first_iteration = False else: if result['is_protected']: print(f"\033[92mPROTECTED\033[0m: {current_path}") else: print(f"\033[91mNOT PROTECTED\033[0m: {current_path}") if result['writeable_existing_paths']: print(f"\033[91mWRITEABLE EXISTING PATHS\033[0m: {', '.join(map(str, result['writeable_existing_paths']))}") if result['writeable_missing_paths']: print(f"\033[91mWRITEABLE MISSING PATHS\033[0m: {', '.join(map(str, result['writeable_missing_paths']))}") print("-"*28) def getReExportLoadCommands(self): ''' Return a list of REEXPORT_DYLIB Load Commands if exists. ''' reexport_load_commands = [] for cmd in self.load_commands: if cmd.command.__name__ == 'REEXPORT_DYLIB': reexport_load_commands.append(cmd) return reexport_load_commands def getReExportPaths(self): '''Return paths stored inside the REEXPORT_DYLIB Load Commands.''' reexport_load_commands = self.getReExportLoadCommands() paths = [] if reexport_load_commands: for load_command in reexport_load_commands: paths.append(self.extractPathFromDylibLoadCommandStruct(load_command)) return paths def getImportedSymbols(self): '''Return a dictionary of imported symbols and names of external libraries where they come from.''' imported_symbols = {} for symbol in self.binary.imported_symbols: binding_info = symbol.binding_info if binding_info: dylib = binding_info.library if dylib: imported_symbols[symbol.name] = dylib.name return imported_symbols def printImportedSymbols(self): ''' Parse getImportedSymbols dictionary in grepable form and print it. Symbol names are grouped (sorted) by library. Example output: symbol_name : library1 symbol_name : library1 symbol_name : library2 symbol_name : library3 ''' imported_symbols = self.getImportedSymbols() grouped_symbols = {} # Group symbols by unresolved library path for symbol_name, unresolved_library_path in imported_symbols.items(): if unresolved_library_path not in grouped_symbols: grouped_symbols[unresolved_library_path] = [] grouped_symbols[unresolved_library_path].append(symbol_name) # Print the grouped symbols for unresolved_library_path, symbols in grouped_symbols.items(): for symbol_name in symbols: print(f'{symbol_name} : {unresolved_library_path}') def getImportedSymbolsFromTargetLib(self, external_library_name): ''' This function is like a `cat printImportedSymbols | grep external_library`. Filter imported symbols in binary (--path binary) to only those from specified external library (--preapre_dylib external_library_name). https://lief-project.github.io/doc/stable/api/python/macho.html#binary https://lief-project.github.io/doc/stable/api/python/macho.html#binding-info https://lief-project.github.io/doc/stable/api/python/macho.html#dylibcommand ''' imported_symbols = self.getImportedSymbols() grep_result = [] for symbol_name, unresolved_library_path in imported_symbols.items(): if external_library_name in unresolved_library_path: grep_result.append(symbol_name) return grep_result def prepareRogueDylib(self, target_library_path=''): ''' Compile m.dylib which by default: 1. Prints log about successful injection to stdout & stderr syslog. 2. If the binary is SUID, sets RUID to EUID and prints user ID. ''' file_name_c = 'm.c' source_code = SourceCodeManager.dylib_hijacking output_filename = 'm.dylib' flag_list = ['-dynamiclib'] if target_library_path: imported_sybols = self.getImportedSymbolsFromTargetLib(target_library_path) else: imported_sybols = [] if imported_sybols: for symbol in imported_sybols: if symbol.startswith('_'): symbol = symbol[1:] function_to_add = f'\nvoid {symbol}(void){{}}' source_code += function_to_add SourceCodeManager.clangCompilerWrapper(file_name_c, source_code, output_filename, flag_list) ### --- V. DYLD --- ### class DyldProcessor: def __init__(self): '''This class contains part of the code from the main() for the SnakeV: Dyld.''' pass def process(self, args): if args.is_built_for_sim: # Check if binary is build for a simulator snake_instance.printIsBuiltForSimulator() if args.get_dyld_env: # Extract DYLD environment variables from the loader binary snake_instance.printDyldEnv() if args.compiled_with_dyld_env: # Print Environment variables from the LC_DYLD_ENVIRONMENT snake_instance.printDyldEnvLoadCommands() if args.has_interposing: # Print if binary has interposing sections print("INTERPOSING: " + str(snake_instance.hasInterposing())) if args.interposing_symbols: # Print all replacement symbols from the __interpose section snake_instance.printInterposingSymbols() class SnakeV(SnakeIV): def __init__(self, binaries, file_path): super().__init__(binaries, file_path) self.platforms = { 1: 'PLATFORM_MACOS', 2: 'PLATFORM_IOS', 3: 'PLATFORM_TVOS', 4: 'PLATFORM_WATCHOS', 5: 'PLATFORM_BRIDGEOS', 6: 'PLATFORM_MACCATALYST', 7: 'PLATFORM_IOSSIMULATOR', 8: 'PLATFORM_TVOSSIMULATOR', 9: 'PLATFORM_WATCHOSSIMULATOR', 10: 'PLATFORM_DRIVERKIT' } # https://github.com/Karmaz95/Snake_Apple/blob/main/IV.%20Dylibs/macos/loader.h#L1275 def isBuiltForSimulator(self): ''' Function for --is_built_for_sim flag. https://lief-project.github.io/doc/stable/api/python/macho.html#lief.MachO.BuildVersion.PLATFORMS Returns True if platform is in : #define PLATFORM_IOSSIMULATOR 7 #define PLATFORM_TVOSSIMULATOR 8 #define PLATFORM_WATCHOSSIMULATOR 9. ''' simulator_platforms = [7,8,9] platform_value = self.binary.build_version.platform.value if platform_value in simulator_platforms: return True, platform_value elif platform_value > 10: return None, platform_value else: return False, platform_value def printIsBuiltForSimulator(self): ''' Print text instead of True|False from the isBuiltForSimulator return. Example outputs: test platform is PLATFORM_IOSSIMULATOR -> built for simulator. executable platform is PLATFORM_MACOS -> not built for simulator ''' name = os.path.basename(self.file_path) platform_check, platform_value = self.isBuiltForSimulator() if platform_check == True: print(f'{name} platform is \033[94m{self.platforms[platform_value]}\033[0m\033[91m -> built for simulator\033[0m. ') elif platform_check == None: print(f'{name} is build for UNKNOWN platform -> \033[94m{platform_value}\033[0m') else: print(f'{name} platform is \033[94m{self.platforms[platform_value]}\033[0m\033[92m -> not built for simulator\033[0m') def getDyldEnv(self): '''Return a list of DYLD environment variables from the binary.''' dyld_env = [] strings_from_CSTRING = self.getStringSection() for s in strings_from_CSTRING: if s.startswith('DYLD_') and '/' not in s: # Exclude DYLD_$ paths (that starts and ends with DYLD_) if s.endswith('DYLD_'): continue # Remove spaces and all after the first occurrence of space s = s.split(' ')[0].strip() if s not in dyld_env: dyld_env.append(s) return dyld_env def printDyldEnv(self): '''Print DYLD environment variables from the binary.''' dyld_env = self.getDyldEnv() if dyld_env: print(*dyld_env, sep='\n') else: print("No DYLD environment variables found.") def enumDyldEnvLoadCommands(self): '''Check if binary has DYLD_ENVIRONMENT load commands.''' all_dyld_env = [] for cmd in self.load_commands: if cmd.command.__name__ == 'DYLD_ENVIRONMENT': all_dyld_env.append(cmd) return all_dyld_env def printDyldEnvLoadCommands(self): '''Print DYLD_ENVIRONMENT load commands.''' all_dyld_env = self.enumDyldEnvLoadCommands() if all_dyld_env: for cmd in all_dyld_env: print(cmd.value) def hasInterposing(self): '''Check if binary has interposing sections.''' for section in self.binary.sections: if section.name == "__interpose": return True return False def getInterposingSymbolsAddresses(self): '''Get replacement symbols addresses from the __interpose section.''' interposing_symbols_addresses = [] bit_mask = 0xffffffff if self.hasInterposing(): for section in self.binary.sections: if section.name == "__interpose": for i in range(0, len(section.content), 16): address = int.from_bytes(section.content[i:i+8], byteorder=self.endianess) interposing_symbols_addresses.append(address) # Remove binary virtual address base to get the symbol offset only ['0x3f54'] instead of ['0x10000000003f54'] i = 0 for addr in interposing_symbols_addresses: interposing_symbols_addresses[i] = addr & bit_mask i+=1 return interposing_symbols_addresses def getInterposingSymbols(self): '''Get all replacement symbols from the __interpose section.''' interposing_symbols_addresses = self.getInterposingSymbolsAddresses() interposing_symbols_names = [] if interposing_symbols_addresses: for symbol in self.getSymbols(): if symbol.value in interposing_symbols_addresses: interposing_symbols_names.append(symbol.name) return interposing_symbols_names, interposing_symbols_addresses def printInterposingSymbols(self): '''Print all replacement symbols from the __interpose section.''' symbol_names, symbol_addrs = self.getInterposingSymbols() for symbol_name, symbol_addrs in zip(symbol_names, symbol_addrs): print(f"{(symbol_name).ljust(32)} {hex(symbol_addrs)}") ### --- VI. AMFI --- ### class AMFIProcessor: def __init__(self): '''This class contains part of the code from the main() for the SnakeVI: AMFI.''' pass def process(self, args): if args.dump_prelink_info is not None: # nargs="?", const='PRELINK_info.txt' # Dump '__PRELINK_INFO,__info' to a given file (default: 'PRELINK_info.txt') snake_instance.dumpPrelink_info(args.dump_prelink_info) if args.dump_prelink_text is not None: # Dump '__PRELINK_TEXT,__text' to a given file (default: 'PRELINK_text.txt') snake_instance.dumpPrelink_text(args.dump_prelink_text) if args.dump_prelink_kext is not None: # Dump prelinked KEXT from decompressed Kernel Cache to a file named: prelinked_{kext_name}.bin snake_instance.dumpKernelExtensionFromPRELINK_TEXT(args.dump_prelink_kext) if args.kext_prelinkinfo: # Print _Prelink properties from PRELINK_INFO,__info for a give kext snake_instance.printParsedPRELINK_INFO_plist(args.kext_prelinkinfo) if args.kmod_info: # Print parsed kmod_info for the given kext snake_instance.printParsedkmod_info(args.kmod_info) if args.kext_entry: # Print kext entrypoint snake_instance.printKextEntryPoint(args.kext_entry) if args.kext_exit: # Print kext exitpoint snake_instance.printKextExitPoint(args.kext_exit) if args.mig: # Search for MIG subsystem and prints message handlers snake_instance.printMIG() if args.has_suid: # Print file SUID status snake_instance.printHasSetUID() if args.has_sgid: # Print file SGID status snake_instance.printHasSetGID() if args.has_sticky: # Print file sticky bit status snake_instance.printStickyBit() if args.injectable_dyld: # Static check for DYLD_INSERT_LIBRARIES snake_instance.printCheckDyldInsertLibraries() if args.test_insert_dylib: # INVASIVE check for DYLD_INSERT_LIBRARIES snake_instance.printTestDyldInsertLibraries() if args.test_prune_dyld: # INVASIVE check for DYLD_PRINT_INITIALIZERS (if DEV are cleared) snake_instance.printTestPruneDyldEnv() if args.test_dyld_print_to_file: # INVASIVE check for DYLD_PRINT_TO_FILE snake_instance.printTestDyldPrintToFile() if args.test_dyld_SLC: # INVASIVE check for DYLD_SHARED_CACHE_DIR snake_instance.printTestDyldSLC() class SnakeVI(SnakeV): def __init__(self, binaries, file_path): super().__init__(binaries, file_path) # This map is just a helper for --dump_kext so the user can specify different names for the same kext. # For instance, amfi instead of AppleMobileFileIntegrity.kext self.kext_map = { 'amfi' : 'applemobilefileintegrity', 'com.apple.driver.applemobilefileintegrity' : 'applemobilefileintegrity', 'applemobilefileintegrity.kext' : 'applemobilefileintegrity', } def loadPRELINK_INFOFromFile(self, prelink_info_filename): # Not used yet. ''' Read PRELINK_INFO,__info section from file (with alignment). The last line in the dumped section plist is broken, because of alignment. This function remove it so the plistlib.loads work. It returns loaded PLIST {prelink_info_plist}. ''' prelink_info_plist_bytes = self.readBytesFromFile(prelink_info_filename) prelink_as_bytes_without_last_line = self.removeNullBytesAlignment(prelink_info_plist_bytes) prelink_info_plist = plistlib.loads(prelink_as_bytes_without_last_line) return prelink_info_plist def calcTwoComplement64(self, value): ''' Convert negative int to hex representation. ''' return hex((value + (1 << 64)) % (1 << 64)) def removeNullBytesAlignment(self, string_as_bytes): ''' The last line in the PLISTs and other files dumped from memory will almost always be aligned with 0x00 bytes. This function: Detects lines in a given bytes {string_as_bytes}. Removes the last line. Returns a new {string_as_bytes}. ''' decoded_string = string_as_bytes.decode('utf-8') decoded_string_without_last_line = decoded_string[:decoded_string.rfind('\n')] string_as_bytes_without_last_line = decoded_string_without_last_line.encode() return string_as_bytes_without_last_line def dumpPrelink_info(self, filename): ''' Dump '__PRELINK_INFO,__info' to a given file (default: 'PRELINK_info.txt') ''' segment_name = '__PRELINK_INFO' section_name = '__info' if self.dumpSection(segment_name, section_name, filename): print("SUCCESS: __PRELINK_INFO,__info dump") def dumpPrelink_text(self, filename): ''' Dump '__PRELINK_TEXT,__text' to a given file (default: 'PRELINK_text.txt') ''' segment_name = '__PRELINK_TEXT' section_name = '__text' if self.dumpSection(segment_name, section_name, filename): print("SUCCESS: __PRELINK_TEXT,__text dump") def extractPRELINK_INFO_plist(self): ''' Extract '__PRELINK_INFO,__info' and return it. ''' segment_name = '__PRELINK_INFO' section_name = '__info' extracted_bytes = self.extractSection(segment_name, section_name) return extracted_bytes def parsePRELINK_INFO_plist(self, kext_name): ''' Extract PLIST properties values from '__PRELINK_INFO,__info' section for the given {kext_name}: _PrelinkBundlePath _PrelinkExecutableLoadAddr _PrelinkExecutableRelativePath _PrelinkExecutableSize _PrelinkExecutableSourceAddr _PrelinkKmodInfo ''' #prelink_info_plist = self.loadPRELINK_INFO(prelink_info_filename) # For loading PRELINK_INFO from file prelink_as_bytes = self.extractPRELINK_INFO_plist() prelink_as_bytes_without_last_line = self.removeNullBytesAlignment(prelink_as_bytes) prelink_info_plist = plistlib.loads(prelink_as_bytes_without_last_line) kext_name = kext_name.lower() if kext_name in self.kext_map: kext_name = self.kext_map[kext_name] # Iterate over the parsed dictionary for item in prelink_info_plist['_PrelinkInfoDictionary']: PrelinkExecutableRelativePath = item.get('_PrelinkExecutableRelativePath', '').lower() # Check if the '_PrelinkExecutableRelativePath' contains {kext_name} in its path if kext_name in PrelinkExecutableRelativePath: # Extract the desired keys and their corresponding values bundle_path = item.get('_PrelinkBundlePath') executable_load_addr = str(item.get('_PrelinkExecutableLoadAddr')).lower() if executable_load_addr.startswith("0x"): executable_load_addr = int(executable_load_addr, 16) elif executable_load_addr.startswith("-"): executable_load_addr = self.calcTwoComplement64(int(executable_load_addr)) executable_relative_path = item.get('_PrelinkExecutableRelativePath') executable_size = str(item.get('_PrelinkExecutableSize')).lower() if executable_size.startswith("0x"): executable_size = int(executable_size, 16) elif executable_size.startswith("-"): executable_size = self.calcTwoComplement64(int(executable_size)) source_addr = str(item.get('_PrelinkExecutableSourceAddr')).lower() if source_addr.startswith("0x"): source_addr = int(source_addr, 16) elif source_addr.startswith("-"): source_addr = self.calcTwoComplement64(int(source_addr)) kmod_info = str(item.get('_PrelinkKmodInfo')).lower() if kmod_info.startswith("0x"): kmod_info = int(kmod_info, 16) elif kmod_info.startswith("-"): kmod_info = self.calcTwoComplement64(int(kmod_info)) return bundle_path, executable_load_addr, executable_relative_path, executable_size, source_addr, kmod_info def printParsedPRELINK_INFO_plist(self, kext_name): ''' Print extracted properties for PRELINK_INFO Plist for a given kext. ''' bundle_path, executable_load_addr, executable_relative_path, executable_size, source_addr, kmod_info = self.parsePRELINK_INFO_plist(kext_name) print(f'_PrelinkBundlePath: {bundle_path}') print(f'_PrelinkExecutableLoadAddr: {executable_load_addr}') print(f'_PrelinkExecutableRelativePath: {executable_relative_path}') print(f'_PrelinkExecutableSize: {hex(int(executable_size))}') print(f'_PrelinkExecutableSourceAddr: {source_addr}') print(f'_PrelinkKmodInfo: {kmod_info}') def dumpKernelExtensionFromPRELINK_TEXT(self, kext_name): ''' Dump prelinked KEXT {kext_name} from decompressed Kernel Cache PRELINK_TEXT segment -p {file_path} to a file named: prelinked_{kext_name}.bin ''' segment_section = '__PRELINK_TEXT,__text' if not self.hasSection(segment_section): # If segment does not exist - break print(f'Specified binary file does not have {segment_section} - the extension was not dumped.') return False _, kext_load_addr, _, kext_size, source_addr, _ = self.parsePRELINK_INFO_plist(kext_name) kext_load_addr = int(kext_load_addr, 16) kext_size = int(kext_size, 16) output_path = f'prelinked_{kext_name}.bin' kext_offset = self.calcRealAddressFromVM(kext_load_addr) self.dumpData(kext_offset, kext_size, output_path) def parsekmod_info(self, kext_name): ''' Parse kmod_info structure for the given {kext_name} from Kernel Cache ''' _, _, _, _, _, kmod_info_vm_addr = self.parsePRELINK_INFO_plist(kext_name) kmod_info_in_file = self.calcRealAddressFromVM(kmod_info_vm_addr) kmod_info_size = ctypes.sizeof(AppleStructuresManager.kmod_info) extracted_kmod_info_bytes = self.extractBytesAtOffset(kmod_info_in_file, kmod_info_size) # debug + #Utils.printQuadWordsLittleEndian64(extracted_kmod_info_bytes) # debug - kmod_info_as_dict = AppleStructuresManager.kmod_info.parse(extracted_kmod_info_bytes) return kmod_info_as_dict def printParsedkmod_info(self, kext_name): ''' Printing function for --kmod_info ''' kmod_info_as_dict = self.parsekmod_info(kext_name) for k, v in kmod_info_as_dict.items(): print(f'{k.ljust(16)}: {v}') def calcKextEntryPoint(self, kext_name): ''' Calculate the __start for the given {kext_name} Kernel Extension ''' kmod_info_as_dict = self.parsekmod_info(kext_name) start = int(kmod_info_as_dict['start'], 16) & 0xFFFFFFFF kernelcache_text_segment = self.getSegment('__TEXT') kernelcache_text_segment_base = kernelcache_text_segment.virtual_address return start + kernelcache_text_segment_base def printKextEntryPoint(self, kext_name): ''' Printing function for --kext_entry flag. ''' kext_entrypoint = hex(self.calcKextEntryPoint(kext_name)) print(f'{kext_name} entrypoint: {kext_entrypoint}') def calcKextExitPoint(self, kext_name): ''' Calculate the __stop for the given {kext_name} Kernel Extension ''' kmod_info_as_dict = self.parsekmod_info(kext_name) stop = int(kmod_info_as_dict['stop'], 16) & 0xFFFFFFFF kernelcache_text_segment = self.getSegment('__TEXT') kernelcache_text_segment_base = kernelcache_text_segment.virtual_address return stop + kernelcache_text_segment_base def printKextExitPoint(self, kext_name): ''' Printing function for --kext_exit flag. ''' kext_exitpoint = hex(self.calcKextEntryPoint(kext_name)) print(f'{kext_name} exitpoint: {kext_exitpoint}') def parseMIG(self): ''' Search for MIG subsystem messages. I was using this Hopper script as an inspiration: https://github.com/knightsc/hopper/blob/master/scripts/MIG%20Detect.py Returns a dictionary like: {'_MIG_subsystem_1000': {'_MIG_msg_1000': routine_for_msg}} ''' va_start = self.getVirtualMemoryStartingAddress() mig_subsystem_size = ctypes.sizeof(AppleStructuresManager.mig_subsystem) routine_descriptor_size = ctypes.sizeof(AppleStructuresManager.routine_descriptor) mig_subsystems = {} # The MIG should be in __DATA,__const | __DATA_CONST,__const | __CONST,__constdata, but it is not always the case. # Great example is decompressed kernelcache, there are no __const section. Conclusion, would be to iterate over each segment, but there is a problem with alignment. for section in self.binary.sections: if ('const' in section.name):# and 'DATA' in section.segment.name): section_bytes = section.content.tobytes() section_size = section.size alignment = pow(2,section.alignment) # Loop through section bytes using alignment to speed up current_offset = 0 while current_offset < section_size: chunk = section_bytes[current_offset:current_offset+mig_subsystem_size] mig_subsystem_dict = AppleStructuresManager.mig_subsystem.parse(chunk) number_of_msgs = mig_subsystem_dict['end'] - mig_subsystem_dict['start'] # Check for possible mig_subsystem structure: if (number_of_msgs > 0 and number_of_msgs < 1024 and mig_subsystem_dict['server'] != 0 and mig_subsystem_dict['start'] > 0 and mig_subsystem_dict['end'] > 0 and mig_subsystem_dict['reserved'] == 0 and mig_subsystem_dict['routine_0'] == 0): ''' # print(f'{hex(mig_subsystem_dict["server"])} {hex(mig_subsystem_dict["start"])}') # At this stage I get 0x8028000000007e74 instead of 0x100007e74 and I do not know why. The same goes for every impl_routine later too... # I can manually repair it by: & 0xffff | __TEXT # It is temp fix, there must be a "proper way" - todo ''' mig_subsystem_dict['server'] = mig_subsystem_dict['server'] & 0xffff | va_start # Fix according to the above comment mig_subsystem_number = mig_subsystem_dict['start'] subsystem_name = "MIG_subsystem_{0}".format(mig_subsystem_number) mig_subsystems[subsystem_name] = {} current_offset += mig_subsystem_size # If mig_subsystem structure was found, iterate over all routines msg = 0 while msg < number_of_msgs: routine_name = "MIG_msg_{0}".format(mig_subsystem_number+msg) chunk = section_bytes[current_offset:current_offset+routine_descriptor_size] routine_descriptor_dict = AppleStructuresManager.routine_descriptor.parse(chunk) if routine_descriptor_dict['impl_routine'] != 0: routine_descriptor_dict['impl_routine'] = routine_descriptor_dict['impl_routine'] & 0xffff | va_start # Fix like subsystem mig_subsystems[subsystem_name].update({routine_name: routine_descriptor_dict}) current_offset += routine_descriptor_size msg += 1 continue # To find more subsystems we continue the parent while without adding below alignment, because we added routine_descriptor_size current_offset += alignment return(mig_subsystems) def printMIG(self): ''' Iterates over each subsystem and its associated messages, printing them in the nice format. ''' mig_subsystems = self.parseMIG() for subsystem, messages in mig_subsystems.items(): print(subsystem + ":") for message, details in messages.items(): print(f"- {message}: {hex(details['impl_routine'])}") def hasSetUID(self): """ Check if a file has the SUID (Set User ID) bit set. Args: filename (str): Path to the file to be checked. Returns: bool: True if SUID bit is set, False otherwise. """ st_mode = os.stat(self.file_path).st_mode return bool(st_mode & stat.S_ISUID) def hasSetGID(self): """ Check if a file has the setgid (Set Group ID) bit set. Args: filename (str): Path to the file to be checked. Returns: bool: True if setgid bit is set, False otherwise. """ st_mode = os.stat(self.file_path).st_mode return bool(st_mode & stat.S_ISGID) def hasStickyBit(self): """ Check if a file has the sticky bit set. Args: filename (str): Path to the file to be checked. Returns: bool: True if sticky bit is set, False otherwise. """ st_mode = os.stat(self.file_path).st_mode return bool(st_mode & stat.S_ISVTX) def printHasSetUID(self): print(f'SUID: {self.hasSetUID()}') def printHasSetGID(self): print(f'SGID: {self.hasSetGID()}') def printStickyBit(self): print(f'STICKY: {self.hasStickyBit()}') def hasAllowDEV(self, file_path): ''' Checks if the binary has com.apple.security.cs.allow-dyld-environment-variables. This allow for Dyld Environment Variables. ''' if self.checkIfEntitlementIsUsed('com.apple.security.cs.allow-dyld-environment-variables', 'true', file_path): return True return False def checkDyldInsertLibraries(self): ''' Check if binary is vulnerable to code injection using DYLD_INSERT_LIBRARIES. ''' cs_flags = self.getCodeSignatureFlags() if cs_flags & 0x2800: # CS_RESTRICT | CS_REQUIRE_LV return False if self.hasSetUID() or self.hasSetGID() or self.hasRestrictSegment(): # SUID | GUID | __RESTRICT,__restrict return False has_insecure_entitlements_combination = self.hasDisableLibraryValidationEntitlement(self.file_path) and self.hasAllowDEV(self.file_path) if (cs_flags & 0x10000) and (not has_insecure_entitlements_combination): # CS_RUNTIME without disabled LV and allowed DEV through entitlements return False return True def printCheckDyldInsertLibraries(self): #print(f'{self.file_path} injectable DYLD_INSERT_LIBRARIES: {self.checkDyldInsertLibraries()}') print(f'Injectable DYLD_INSERT_LIBRARIES: {self.checkDyldInsertLibraries()}') def listenSyslog(self, test_string, test_string_found, stop_event, timeout=2): ''' Function to listen (for 2 seconds by default) to macOS system logs for a specific string. ''' # Run the log command to retrieve system log messages process = subprocess.Popen(['log', 'stream', '--timeout', str(timeout)], stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True) for line in process.stdout: if test_string in line: test_string_found.set() return if stop_event.is_set(): return def testDyldInsertLibraries(self): ''' Checking if DYLD_INSERT_LIBRARIES is allowed. INVASIVE: 0. Check if /tmp/crimson_stalker.dylib exists. 1. If not - the library /tmp/crimson_stalker.dylib is compiled. 2. Binary is executed with DYLD_INSERT_LIBRARIES=/tmp/crimson_stalker.dylib 3. Library is NOT REMOVED it stays in /tmp/ in case of massive checks with loops. ''' stalker_path = '/tmp/crimson_stalker.dylib' env_variable = f'DYLD_INSERT_LIBRARIES={stalker_path}' test_string = 'crimson_stalker library injected into ' # Compile dylib if not exist: if not os.path.exists(stalker_path): file_name_c = '/tmp/crimson_stalker.c' source_code = SourceCodeManager.crimson_stalker output_filename = stalker_path flag_list = ['-dynamiclib'] SourceCodeManager.clangCompilerWrapper(file_name_c, source_code, output_filename, flag_list) # Create a threading event to signal when the test string is found in syslog or to stop listenSyslog thread (using Event as a flag and .set() as a switch) test_string_found = threading.Event() # Used in listenSyslog -> when test_string_found.set() is called, it is final check if test_string was found in syslogs. stop_event = threading.Event() # Used in this function -> when stop_event.set() is called below, it inform listenSyslog to stop.s # Start listening for syslog messages in a separate thread syslog_listener_thread = threading.Thread(target=self.listenSyslog, args=(test_string, test_string_found, stop_event)) syslog_listener_thread.start() # To avoid Race Codition false positives because syslog_listener_thread just started # We must wait for at least 0.1 for listenSyslog to start reading logs # Then we can execute the command below without a fear it will be omited in by the syslog_listener_thread. time.sleep(0.2) # 0.2 here and 2 for the timeout in listenSyslog is enough # Execute the command and capture stdout and stderr command = f'{env_variable} {self.file_path}' process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, shell=True) stdout, stderr = process.communicate() # Wait for the subprocess to finish process.wait() stdout = stdout.decode('utf-8') stderr = stderr.decode('utf-8') # Check if the test string was found in stdout (it should not appear in stderr, but I check for that, you never know :D) if (test_string in stdout) or (test_string in stderr): stop_event.set() return True # Wait for the thread to finish syslog_listener_thread.join() # Check if the test string was found in syslog if test_string_found.is_set(): # return True return False def printTestDyldInsertLibraries(self): print(f'DYLD_INSERT_LIBRARIES is allowed: {self.testDyldInsertLibraries()}') def testPruneDyldEnv(self): ''' Checking if Dyld Environment Variables are cleared (INVASIVE - the binary is executed) ''' env_variable = 'DYLD_PRINT_INITIALIZERS=1' test_string = 'running initializer ' # Execute the command and capture stdout and stderr command = f'{env_variable} {self.file_path}' process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, shell=True) stdout, stderr = process.communicate() stdout = stdout.decode('utf-8') stderr = stderr.decode('utf-8') if test_string in stderr: return False return True def printTestPruneDyldEnv(self): #print(f'{self.file_path} DEV Pruned: {self.testPruneDyldEnv()}') print(f'DEV Pruned: {self.testPruneDyldEnv()}') def testDyldPrintToFile(self): ''' Checking if DYLD_PRINT_TO_FILE Dyld Environment Variables works. INVASIVE: 1. The binary is executed. 2. The file /tmp/crimson_1029384756_testDyldPrintToFile.txt is created if env works. 3. The file is then removed ''' test_file_path = '/tmp/crimson_1029384756_testDyldPrintToFile.txt' env_variable = f'DYLD_PRINT_TO_FILE={test_file_path}' # Execute the command and capture stdout and stderr command = f'{env_variable} {self.file_path}' process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, shell=True) stdout, stderr = process.communicate() #process.wait() stdout = stdout.decode('utf-8') stderr = stderr.decode('utf-8') if os.path.exists(test_file_path): os.remove(test_file_path) return True return False def printTestDyldPrintToFile(self): print(f'DYLD_PRINT_TO_FILE allowed: {self.testDyldPrintToFile()}') def testDyldSLC(self): ''' Checking if DYLD_SHARED_REGION=private Dyld Environment Variables works and code can be injected using DYLD_SHARED_CACHE_DIR. INVASIVE: 1. The binary is executed. 2. DYLD_SHARED_CACHE_DIR=/tmp - this should trigger error, as there are no SLC in tmp. 3. If there is an error "dyld private shared cache could not be found" the binary is vulnerable. ''' test_file_path = '/tmp' env_variable_1 = f'DYLD_SHARED_CACHE_DIR={test_file_path}' env_variable_2 = f'DYLD_SHARED_REGION=private' # Execute the command and capture stdout and stderr command = f'{env_variable_1} {env_variable_2} {self.file_path}' process = subprocess.Popen(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE, shell=True) stdout, stderr = process.communicate() stdout = stdout.decode('utf-8') stderr = stderr.decode('utf-8') if 'dyld private shared cache could not be found' in stderr: return True return False def printTestDyldSLC(self): print(f'DYLD_SHARED_CACHE_DIR allowed: {self.testDyldSLC()}') ### --- ARGUMENT PARSER --- ### class ArgumentParser: def __init__(self): '''Class for parsing arguments from the command line. I decided to remove it from main() for additional readability and easier code maintenance in the VScode''' self.parser = argparse.ArgumentParser(description="Mach-O files parser for binary analysis") self.addGeneralArgs() self.addMachOArgs() self.addCodeSignArgs() self.addChecksecArgs() self.addDylibsArgs() self.addDyldArgs() self.addAMFIArgs() def addGeneralArgs(self): self.parser.add_argument('-p', '--path', required=True, help="Path to the Mach-O file") def addMachOArgs(self): macho_group = self.parser.add_argument_group('MACH-O ARGS') macho_group.add_argument('--file_type', action='store_true', help="Print binary file type") macho_group.add_argument('--header_flags', action='store_true', help="Print binary header flags") macho_group.add_argument('--endian', action='store_true', help="Print binary endianess") macho_group.add_argument('--header', action='store_true', help="Print binary header") macho_group.add_argument('--load_commands', action='store_true', help="Print binary load commands names") macho_group.add_argument('--has_cmd', metavar='LC_MAIN', help="Check of binary has given load command") macho_group.add_argument('--segments', action='store_true', help="Print binary segments in human-friendly form") macho_group.add_argument('--has_segment', help="Check if binary has given '__SEGMENT'", metavar='__SEGMENT') macho_group.add_argument('--sections', action='store_true', help="Print binary sections in human-friendly form") macho_group.add_argument('--has_section', help="Check if binary has given '__SEGMENT,__section'", metavar='__SEGMENT,__section') macho_group.add_argument('--symbols', action='store_true', help="Print all binary symbols") macho_group.add_argument('--imports', action='store_true', help="Print imported symbols") macho_group.add_argument('--exports', action='store_true', help="Print exported symbols") macho_group.add_argument('--imported_symbols', action='store_true', help="Print symbols imported from external libraries with dylib names") macho_group.add_argument('--chained_fixups', action='store_true', help="Print Chained Fixups information") macho_group.add_argument('--exports_trie', action='store_true', help="Print Export Trie information") macho_group.add_argument('--uuid', action='store_true', help="Print UUID") macho_group.add_argument('--main', action='store_true', help="Print entry point and stack size") macho_group.add_argument('--encryption_info', nargs='?',const='', help="Print encryption info if any. Optionally specify an output path to dump the encrypted data (if cryptid=0, data will be in plain text)", metavar="(optional) save_path.bytes") macho_group.add_argument('--strings_section', action='store_true', help="Print strings from __cstring section") macho_group.add_argument('--all_strings', action='store_true', help="Print strings from all sections") macho_group.add_argument('--save_strings', help="Parse all sections, detect strings, and save them to a file", metavar='all_strings.txt') macho_group.add_argument('--info', action='store_true', default=False, help="Print header, load commands, segments, sections, symbols, and strings") macho_group.add_argument('--dump_data', help="Dump {size} bytes starting from {offset} to a given {filename} (e.g. '0x1234,0x1000,out.bin')", metavar=('offset,size,output_path'), nargs="?") macho_group.add_argument('--calc_offset', help="Calculate the real address (file on disk) of the given Virtual Memory {vm_offset} (e.g. 0xfffffe000748f580)", metavar='vm_offset') macho_group.add_argument('--constructors', action='store_true', help="Print binary constructors") def addCodeSignArgs(self): codesign_group = self.parser.add_argument_group('CODE SIGNING ARGS') codesign_group.add_argument('--verify_signature', action='store_true', default=False, help="Code Signature verification (if the contents of the binary have been modified)") codesign_group.add_argument('--cd_info', action='store_true', default=False, help="Print Code Signature information") codesign_group.add_argument('--cd_requirements', action='store_true', default=False, help="Print Code Signature Requirements") codesign_group.add_argument('--entitlements', help="Print Entitlements in a human-readable, XML, or DER format (default: human)", nargs='?', const='human', metavar='human|xml|var') codesign_group.add_argument('--extract_cms', help="Extract CMS Signature from the Code Signature and save it to a given file", metavar='cms_signature.der') codesign_group.add_argument('--extract_certificates', help="Extract Certificates and save them to a given file. To each filename will be added an index at the end: _0 for signing, _1 for intermediate, and _2 for root CA certificate", metavar='certificate_name') codesign_group.add_argument('--remove_sig', help="Save the new file on a disk with removed signature", metavar='unsigned_binary') codesign_group.add_argument('--sign_binary', help="Sign binary using specified identity - use : 'security find-identity -v -p codesigning' to get the identity (default: adhoc)", nargs='?', const='adhoc', metavar='adhoc|identity') codesign_group.add_argument('--cs_offset', action='store_true', help="Print Code Signature file offset") codesign_group.add_argument('--cs_flags', action='store_true', help="Print Code Signature flags") def addChecksecArgs(self): checksec_group = self.parser.add_argument_group('CHECKSEC ARGS') checksec_group.add_argument('--has_pie', action='store_true', default=False, help="Check if Position-Independent Executable (PIE) is set") checksec_group.add_argument('--has_arc', action='store_true', default=False, help="Check if Automatic Reference Counting (ARC) is in use (can be false positive)") checksec_group.add_argument('--is_stripped', action='store_true', default=False, help="Check if binary is stripped") checksec_group.add_argument('--has_canary', action='store_true', default=False, help="Check if Stack Canary is in use (can be false positive)") checksec_group.add_argument('--has_nx_stack', action='store_true', default=False, help="Check if stack is non-executable (NX stack)") checksec_group.add_argument('--has_nx_heap', action='store_true', default=False, help="Check if heap is non-executable (NX heap)") checksec_group.add_argument('--has_xn', action='store_true', default=False, help="Check if binary is protected by eXecute Never (XN) ARM protection") checksec_group.add_argument('--is_notarized', action='store_true', default=False, help="Check if the application is notarized and can pass the Gatekeeper verification") checksec_group.add_argument('--is_encrypted', action='store_true', default=False, help="Check if the application is encrypted (has LC_ENCRYPTION_INFO(_64) and cryptid set to 1)") checksec_group.add_argument('--is_restricted', action='store_true', default=False, help="Check if binary has __RESTRICT segment or CS_RESTRICT flag set") checksec_group.add_argument('--is_hr', action='store_true', default=False, help="Check if the Hardened Runtime is in use") checksec_group.add_argument('--is_as', action='store_true', default=False, help="Check if the App Sandbox is in use") checksec_group.add_argument('--is_fort', action='store_true', default=False, help="Check if the binary is fortified") checksec_group.add_argument('--has_rpath', action='store_true', default=False, help="Check if the binary utilise any @rpath variables") checksec_group.add_argument('--has_lv', action='store_true', default=False, help="Check if the binary has Library Validation (protection against Dylib Hijacking)") checksec_group.add_argument('--checksec', action='store_true', default=False, help="Run all checksec module options on the binary") def addDylibsArgs(self): dylibs_group = self.parser.add_argument_group('DYLIBS ARGS') dylibs_group.add_argument('--dylibs', action='store_true', default=False, help="Print shared libraries used by specified binary with compatibility and the current version (loading paths unresolved, like @rpath/example.dylib)") dylibs_group.add_argument('--rpaths', action='store_true', default=False, help="Print all paths (resolved) that @rpath can be resolved to") dylibs_group.add_argument('--rpaths_u', action='store_true', default=False, help="Print all paths (unresolved) that @rpath can be resolved to") dylibs_group.add_argument('--dylibs_paths', action='store_true', default=False, help="Print absolute dylib loading paths (resolved @rpath|@executable_path|@loader_path) in order they are searched for") dylibs_group.add_argument('--dylibs_paths_u', action='store_true', default=False, help="Print unresolved dylib loading paths.") dylibs_group.add_argument('--broken_relative_paths', action='store_true', default=False, help="Print 'broken' relative paths from the binary (cases where the dylib source is specified for an executable directory without @executable_path)") dylibs_group.add_argument('--dylibtree', metavar=('cache_path,output_path,is_extracted'), nargs = '?', const=",,0", help='Print the dynamic dependencies of a Mach-O binary recursively. You can specify the Dyld Shared Cache path in the first argument, the output directory as the 2nd argument, and if you have already extracted DSC in the 3rd argument (0 or 1). The output_path will be used as a base for dylibtree. For example, to not extract DSC, use: --dylibs ",,1", or to extract from default to default use just --dylibs or --dylibs ",,0" which will extract DSC to extracted_dyld_share_cache/ in the current directory') dylibs_group.add_argument('--dylib_id', action='store_true', default=False, help="Print path from LC_ID_DYLIB") dylibs_group.add_argument('--reexport_paths', action='store_true', default=False, help="Print paths from LC_REEXPORT_DLIB") dylibs_group.add_argument('--hijack_sec', action='store_true', default=False, help="Check if binary is protected against Dylib Hijacking") dylibs_group.add_argument('--dylib_hijacking', metavar='(optional) cache_path' ,nargs="?", const="default", help="Check for possible Direct and Indirect Dylib Hijacking loading paths. The output is printed to console and saved in JSON format to /tmp/dylib_hijacking_log.json(append mode). Optionally, specify the path to the Dyld Shared Cache") dylibs_group.add_argument('--dylib_hijacking_a', metavar='cache_path', nargs="?", const="default", help="Like --dylib_hijacking, but shows only possible vectors (without protected binaries)") dylibs_group.add_argument('--prepare_dylib', metavar='(optional) target_dylib_name', nargs="?", const='', help="Compile rogue dylib. Optionally, specify target_dylib_path, it will search for the imported symbols from it in the dylib specified in the --path argument and automatically add it to the source code of the rogue lib. Example: --path lib1.dylib --prepare_dylib /path/to/lib2.dylib") def addDyldArgs(self): dyld_group = self.parser.add_argument_group('DYLD ARGS') dyld_group.add_argument('--is_built_for_sim', action='store_true', default=False, help="Check if binary is built for simulator platform.") dyld_group.add_argument('--get_dyld_env', action='store_true', default=False, help="Extract Dyld environment variables from the loader binary.") dyld_group.add_argument('--compiled_with_dyld_env', action='store_true', default=False, help="Check if binary was compiled with -dyld_env flag and print the environment variables and its values.") dyld_group.add_argument('--has_interposing', action='store_true', default=False, help="Check if binary has interposing sections.") dyld_group.add_argument('--interposing_symbols', action='store_true', default=False, help="Print interposing symbols if any.") def addAMFIArgs(self): dyld_group = self.parser.add_argument_group('AMFI ARGS') dyld_group.add_argument('--dump_prelink_info', metavar='(optional) out_name', nargs="?", const='PRELINK_info.txt', help='Dump "__PRELINK_INFO,__info" to a given file (default: "PRELINK_info.txt")') dyld_group.add_argument('--dump_prelink_text', metavar='(optional) out_name', nargs="?", const='PRELINK_text.txt', help='Dump "__PRELINK_TEXT,__text" to a given file (default: "PRELINK_text.txt")') dyld_group.add_argument('--dump_prelink_kext', metavar='kext_name', nargs="?", help='Dump prelinked KEXT {kext_name} from decompressed Kernel Cache PRELINK_TEXT segment to a file named: prelinked_{kext_name}.bin') dyld_group.add_argument('--kext_prelinkinfo', metavar='kext_name', nargs="?", help='Print _Prelink properties from PRELINK_INFO,__info for a give {kext_name}') dyld_group.add_argument('--kmod_info', metavar='kext_name', help="Parse kmod_info structure for the given {kext_name} from Kernel Cache") dyld_group.add_argument('--kext_entry', metavar='kext_name', help="Calculate the virtual memory address of the __start (entrypoint) for the given {kext_name} Kernel Extension") dyld_group.add_argument('--kext_exit', metavar='kext_name', help="Calculate the virtual memory address of the __stop (exitpoint) for the given {kext_name} Kernel Extension") dyld_group.add_argument('--mig', action='store_true', help="Search for MIG subsystem and prints message handlers") dyld_group.add_argument('--has_suid', action='store_true', help="Check if the file has SetUID bit set") dyld_group.add_argument('--has_sgid', action='store_true', help="Check if the file has SetGID bit set") dyld_group.add_argument('--has_sticky', action='store_true', help="Check if the file has sticky bit set") dyld_group.add_argument('--injectable_dyld', action='store_true', help="Check if the binary is injectable using DYLD_INSERT_LIBRARIES") dyld_group.add_argument('--test_insert_dylib', action='store_true', help="Check if it is possible to inject dylib using DYLD_INSERT_LIBRARIES (INVASIVE - the binary is executed)") dyld_group.add_argument('--test_prune_dyld', action='store_true', help="Check if Dyld Environment Variables are cleared (using DYLD_PRINT_INITIALIZERS=1) (INVASIVE - the binary is executed)") dyld_group.add_argument('--test_dyld_print_to_file', action='store_true', help="Check if DYLD_PRINT_TO_FILE Dyld Environment Variables works (INVASIVE - the binary is executed)") dyld_group.add_argument('--test_dyld_SLC', action='store_true', help="Check if DYLD_SHARED_REGION=private Dyld Environment Variables works and code can be injected using DYLD_SHARED_CACHE_DIR (INVASIVE - the binary is executed)") def parseArgs(self): return self.parser.parse_args() def printAllArgs(self, args): '''Just for debugging. This method is a utility designed to print all parsed arguments and their corresponding values.''' for arg, value in vars(args).items(): print(f"{arg}: {value}") ### --- SOURCE CODE --- ### class SourceCodeManager: crimson_stalker = r''' // clang -dynamiclib /tmp/crimson_stalker.c -o /tmp/crimson_stalker.dylib #include #include __attribute__((constructor)) void myconstructor(int argc, const char **argv) { syslog(LOG_ERR, "crimson_stalker library injected into %s\n", argv[0]); printf("crimson_stalker library injected into %s\n", argv[0]); } ''' dylib_hijacking = r''' // clang -dynamiclib m.c -o m.dylib //-o $PWD/TARGET_DYLIB #include #include #include #include __attribute__((constructor)) void myconstructor(int argc, const char **argv) { syslog(LOG_ERR, "[+] m.dylib injected in %s\n", argv[0]); printf("[+] m.dylib injected in %s\n", argv[0]); setuid(0); system("id"); //system("/bin/sh"); } ''' @staticmethod def clangCompilerWrapper(file_name_c, source_code, output_filename, flag_list=None): # Save the source code to a file with open(file_name_c, "w") as source_file: source_file.write(source_code) # Compile the source code using clang clang_command = ["clang", file_name_c, "-o", output_filename, *flag_list] subprocess.run(clang_command, check=True) ### --- APPLE CODE --- ### class AppleStructuresManager: ''' It stores Apple structures and their parsers. ''' class kmod_info(ctypes.Structure): ''' REF: https://github.com/apple-oss-distributions/xnu/blob/1031c584a5e37aff177559b9f69dbd3c8c3fd30a/osfmk/mach/kmod.h#L87 ''' _pack_ = 1 # Specify the byte order (little-endian) _fields_ = [ ("next", ctypes.c_uint64), # Simplifying the structure, it should be: struct kmod_info * next; ("info_version", ctypes.c_int32), ("id", ctypes.c_uint32), ("name", ctypes.c_char * 64), ("version", ctypes.c_char * 64), ("reference_count", ctypes.c_int32), ("reference_list", ctypes.c_uint64), ("address", ctypes.c_uint64), ("size", ctypes.c_uint64), ("hdr_size", ctypes.c_uint64), ("start", ctypes.c_uint64), ("stop", ctypes.c_uint64) ] def parse(data): # Create an instance of the kmod_info structure info = AppleStructuresManager.kmod_info() # Cast the binary data to the structure ctypes.memmove(ctypes.byref(info), data, ctypes.sizeof(info)) # Convert name and version to strings name = info.name.decode('utf-8').rstrip('\x00') version = info.version.decode('utf-8').rstrip('\x00') # Return parsed data as a dictionary return { "next": info.next, "info_version": info.info_version, "id": hex(info.id), "name": name, "version": version, "reference_count": info.reference_count, "reference_list": hex(info.reference_list), "address": hex(info.address), "size": hex(info.size), "hdr_size": hex(info.hdr_size), "start": hex(info.start), "stop": hex(info.stop) } class mig_subsystem(ctypes.Structure): ''' REF: https://github.com/apple-oss-distributions/xnu/blob/1031c584a5e37aff177559b9f69dbd3c8c3fd30a/osfmk/mach/mig.h#L121C16-L121C29 ''' _pack_ = 1 # Specify the byte order (little-endian) _fields_ = [ ("server", ctypes.c_uint64), # Pointer to demux routine ("start", ctypes.c_uint32), # Min routine number ("end", ctypes.c_uint32), # Max routine number + 1 ("maxsize", ctypes.c_uint64), # Max reply message size ("reserved", ctypes.c_uint64), # Reserved for MIG use ("routine_0", ctypes.c_uint64) # Routine descriptor array ] def parse(data): # Create an instance of the structure info = AppleStructuresManager.mig_subsystem() # Cast the binary data to the structure ctypes.memmove(ctypes.byref(info), data, ctypes.sizeof(info)) # Return parsed data as a dictionary return { "server": info.server, "start": info.start, "end": info.end, "maxsize": info.maxsize, "reserved": info.reserved, "routine_0": info.routine_0, } class routine_descriptor(ctypes.Structure): ''' REF: https://github.com/apple-oss-distributions/xnu/blob/1031c584a5e37aff177559b9f69dbd3c8c3fd30a/osfmk/mach/mig.h#L105C8-L105C26 ''' _pack_ = 1 # Specify the byte order (little-endian) _fields_ = [ ("impl_routine", ctypes.c_uint64), # Server work func pointer ("stub_routine", ctypes.c_uint64), # Unmarshalling func pointer ("argc", ctypes.c_uint32), # Number of argument words ("descr_count", ctypes.c_uint32), # Number complex descriptors ("arg_descr", ctypes.c_uint64), # Pointer to descriptor array ("max_reply_msg", ctypes.c_uint64) # Max size for reply msg ] def parse(data): # Create an instance of the structure info = AppleStructuresManager.routine_descriptor() # Cast the binary data to the structure ctypes.memmove(ctypes.byref(info), data, ctypes.sizeof(info)) # Return parsed data as a dictionary return { "impl_routine": info.impl_routine, "stub_routine": info.stub_routine, "argc": info.argc, "descr_count": info.descr_count, "arg_descr": info.arg_descr, "max_reply_msg": info.max_reply_msg, } class CodeDirectory(ctypes.BigEndianStructure): ''' REF: https://github.com/Karmaz95/Snake_Apple/blob/0b5b02fdb954ca5f63eb240092cf98a68fa4e19f/II.%20Code%20Signing/mac/cs_blobs.h#L212C16-L212C31''' class v0(ctypes.BigEndianStructure): _fields_ = [ ("magic", ctypes.c_uint32), ("length", ctypes.c_uint32), ("version", ctypes.c_uint32), ("flags", ctypes.c_uint32), ("hashOffset", ctypes.c_uint32), ("identOffset", ctypes.c_uint32), ("nSpecialSlots", ctypes.c_uint32), ("nCodeSlots", ctypes.c_uint32), ("codeLimit", ctypes.c_uint32), ("hashSize", ctypes.c_uint8), ("hashType", ctypes.c_uint8), ("platform", ctypes.c_uint8), ("pageSize", ctypes.c_uint8), ("spare2", ctypes.c_uint32), ] class v20100(v0): _fields_ = [ ("scatterOffset", ctypes.c_uint32), ] class v20200(v20100): _fields_ = [ ("teamOffset", ctypes.c_uint32), ] class v20300(v20200): _fields_ = [ ("spare3", ctypes.c_uint32), ("codeLimit64", ctypes.c_uint64), ] class v20400(v20300): _fields_ = [ ("execSegBase", ctypes.c_uint64), ("execSegLimit", ctypes.c_uint64), ("execSegFlags", ctypes.c_uint64), ] class v20500(v20400): _fields_ = [ ("runtime", ctypes.c_uint32), ("preEncryptOffset", ctypes.c_uint32), ] class v20600(v20500): _fields_ = [ ("linkageHashType", ctypes.c_uint8), ("linkageApplicationType", ctypes.c_uint8), ("linkageApplicationSubType", ctypes.c_uint16), ("linkageOffset", ctypes.c_uint32), ("linkageSize", ctypes.c_uint32), ] def __init__(self, version): self.version = version if version == 0x20100: self.info = self.v20100() elif version == 0x20200: self.info = self.v20200() elif version == 0x20300: self.info = self.v20300() elif version == 0x20400: self.info = self.v20400() elif version == 0x20500: self.info = self.v20500() elif version == 0x20600: self.info = self.v20600() else: self.info = self.v0() def parse(self, data): ctypes.memmove(ctypes.byref(self.info), data, min(ctypes.sizeof(self.info), len(data))) # Return parsed data as a dictionary return { "magic": getattr(self.info, "magic", None), "length": getattr(self.info, "length", None), "version": getattr(self.info, "version", None), "flags": getattr(self.info, "flags", None), "hashOffset": getattr(self.info, "hashOffset", None), "identOffset": getattr(self.info, "identOffset", None), "nSpecialSlots": getattr(self.info, "nSpecialSlots", None), "nCodeSlots": getattr(self.info, "nCodeSlots", None), "codeLimit": getattr(self.info, "codeLimit", None), "hashSize": getattr(self.info, "hashSize", None), "hashType": getattr(self.info, "hashType", None), "platform": getattr(self.info, "platform", None), "pageSize": getattr(self.info, "pageSize", None), "spare2": getattr(self.info, "spare2", None), "scatterOffset": getattr(self.info, "scatterOffset", None), "teamOffset": getattr(self.info, "teamOffset", None), "spare3": getattr(self.info, "spare3", None), "codeLimit64": getattr(self.info, "codeLimit64", None), "execSegBase": getattr(self.info, "execSegBase", None), "execSegLimit": getattr(self.info, "execSegLimit", None), "execSegFlags": getattr(self.info, "execSegFlags", None), "runtime": getattr(self.info, "runtime", None), "preEncryptOffset": getattr(self.info, "preEncryptOffset", None), "linkageHashType": getattr(self.info, "linkageHashType", None), "linkageApplicationType": getattr(self.info, "linkageApplicationType", None), "linkageApplicationSubType": getattr(self.info, "linkageApplicationSubType", None), "linkageOffset": getattr(self.info, "linkageOffset", None), "linkageSize": getattr(self.info, "linkageSize", None), } ### --- UTILS / DEBUG --- ### class Utils: def printQuadWordsLittleEndian64(byte_string, columns=2): ''' Print Q values from given {byte_string} in {columns} columns (default 2) 0000000000000000 FFFFFFFF00000001 6C7070612E6D6F63 7265766972642E65 ''' # Ensure the byte string length is a multiple of 8 while len(byte_string) % 8 != 0: byte_string += b'\x00' # Add padding to make it divisible by 8 # Convert the byte string to a list of integers byte_list = list(byte_string) # Group the bytes into 8-byte chunks chunks = [byte_list[i:i+8] for i in range(0, len(byte_list), 8)] # Print the raw bytes in 64-bit little-endian order print("Raw bytes (64-bit little-endian):") i = 1 for chunk in chunks: chunk_value = int.from_bytes(chunk, byteorder='little') if i < columns: print(f"{chunk_value:016X}", end=" ") else: print(f"{chunk_value:016X}", end="\n") i = 0 i+=1 print() def printQuadWordsBigEndian64(byte_string, columns=2): ''' Print Q values from given {byte_string} in {columns} columns (default 2) 0000000000000000 FFFFFFFF00000001 6C7070612E6D6F63 7265766972642E65 ''' # Ensure the byte string length is a multiple of 8 while len(byte_string) % 8 != 0: byte_string += b'\x00' # Add padding to make it divisible by 8 # Convert the byte string to a list of integers byte_list = list(byte_string) # Group the bytes into 8-byte chunks chunks = [byte_list[i:i+8] for i in range(0, len(byte_list), 8)] # Print the raw bytes in 64-bit big-endian order print("Raw bytes (64-bit big-endian):") i = 1 for chunk in chunks: chunk_value = int.from_bytes(chunk, byteorder='big') # Changed to 'big' if i < columns: print(f"{chunk_value:016X}", end=" ") else: print(f"{chunk_value:016X}", end="\n") i = 0 i += 1 print() def printRawHex(byte_string): ''' Print bytes as raw hexes (without endianess). 01 00 00 00 ff ff ... ''' hex_string = ' '.join(f'{byte:02x}' for byte in byte_string) print(hex_string) if __name__ == "__main__": arg_parser = ArgumentParser() args = arg_parser.parseArgs() file_path = os.path.abspath(args.path) ### --- I. MACH-O --- ### macho_processor = MachOProcessor(file_path) macho_processor.process(args) ### --- II. CODE SIGNING --- ### code_signing_processor = CodeSigningProcessor() code_signing_processor.process(args) ### --- III. CHECKSEC --- ### checksec_processor = ChecksecProcessor() checksec_processor.process(args) ### --- IV. DYLIBS --- ### dylibs_processor = DylibsProcessor() dylibs_processor.process(args) ### --- V. DYLD --- ### dyld_processor = DyldProcessor() dyld_processor.process(args) ### --- VI. AMFI --- ### amfi_processor = AMFIProcessor() amfi_processor.process(args)