From dceee00b32e33b6b187e9d8a67e86aa0038918b6 Mon Sep 17 00:00:00 2001 From: Karmaz95 Date: Sat, 9 Mar 2024 23:29:23 +0100 Subject: [PATCH] --- README.md | 8 +- .../PSEUDO_macos_dyld_policy_at_path.c | 4 +- .../PSEUDO_macos_dyld_policy_collect_state.c | 5 +- VI. AMFI/python/CrimsonUroboros.py | 1779 +++++++++++++++++ 4 files changed, 1788 insertions(+), 8 deletions(-) create mode 100755 VI. AMFI/python/CrimsonUroboros.py diff --git a/README.md b/README.md index abbd1ed..2c03ed4 100644 --- a/README.md +++ b/README.md @@ -284,9 +284,9 @@ brew install blacktop/tap/ipsw * `--dylib_hijacking` needs [ipsw](https://github.com/blacktop/ipsw) to be installed. * `--dylibtree` needs the [dyld-shared-cache-extractor](https://github.com/keith/dyld-shared-cache-extractor) to be installed. - ## WHY UROBOROS? -I will write the code for each article as a class SnakeX, where X will be the article number. To make it easier for the audience to follow. Each Snake class will be a child of the previous one and infinitely "eat itself" (inherit methods of the previous class), like Uroboros. +I will write the code for each article as a class SnakeX, where X will be the article number, to make it easier for the audience to follow. +Each Snake class will be a child of the previous one and infinitely "eat itself" (inherit methods of the previous class), like Uroboros. ## ADDITIONAL LINKS * [Apple Open Source](https://opensource.apple.com/releases/) @@ -301,4 +301,6 @@ I will write the code for each article as a class SnakeX, where X will be the ar * After making a SuperBlob parser and CodeDirectory blob parser, modify hasHardenedRuntime to check Runtime flag by using bitmask, instead of string. * Build Dyld Shared Cache parser and extractor to make SnakeIV independant of dyld-shared-cache-extractor. * Make testing branch and implement tests, before pushing new updates. -* Create `RottenApple.app` in another repository and use it for testing. \ No newline at end of file +* Create `RottenApple.app` in another repository and use it for testing. +* Add Dyld Closure chapter to Snake&Apple V - Dyld +* Move `dumpPrelink_info` and `dumpPrelink_text` to Snake & Apple chapter about Kernel Extensions when ready. \ No newline at end of file diff --git a/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_at_path.c b/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_at_path.c index 8ed46c7..197d3de 100644 --- a/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_at_path.c +++ b/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_at_path.c @@ -20,10 +20,10 @@ macos_dyld_policy_at_path(proc *process, amfi_dyld_policy_state_t *policy_state) log("RPL: 0, HR: 0, RP: 0, LV: 0"); } } else { - // 0x40 == CS_EXECSEG_JIT used ?? (not sure aobut it) + // Check if 0x40 == CS_EXECSEG_JIT is used ?? (not sure about it) if ((flags & 0x40) != 0) { - // (macOS Only) Page invalidation allowed by task port policy (CS_INVALID_ALLOWED == 0x20) not used + // Check if (macOS Only) Page invalidation allowed by task port policy (CS_INVALID_ALLOWED == 0x20) is not used if ((flags & 0x20) == 0) { // Check if process does not use Library Validation diff --git a/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_collect_state.c b/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_collect_state.c index a753354..8b18168 100644 --- a/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_collect_state.c +++ b/VI. AMFI/custom/AMFI_RE/PSEUDO_macos_dyld_policy_collect_state.c @@ -23,8 +23,8 @@ macos_dyld_policy_collect_state(calling_process, param_2, amfi_dyld_policy_state // Check if forced library validation is enabled (required by Hardened System Policy) has_CS_FORCED_LV = check_forced_library_validation(calling_process); - // Check macOS platform (hardware) - platform = get_platform(); + // Check if binary is inside trust cache (CS_PLATFORM_BINARY == 0x4000000 | CS_DYLD_PLATFORM == 0x2000000) + platform = is_platform_binary(); // Check if Hardened Runtime is enabled has_HR = check_hardened_runtime(calling_process); @@ -75,4 +75,3 @@ macos_dyld_policy_collect_state(calling_process, param_2, amfi_dyld_policy_state } - diff --git a/VI. AMFI/python/CrimsonUroboros.py b/VI. AMFI/python/CrimsonUroboros.py new file mode 100755 index 0000000..af79422 --- /dev/null +++ b/VI. AMFI/python/CrimsonUroboros.py @@ -0,0 +1,1779 @@ +#!/usr/bin/env python3 +import lief +import uuid +import argparse +import subprocess +import os +import sys +import mmap +import plistlib +import json +import sys +import treelib + +### --- I. MACH-O --- ### +class MachOProcessor: + def __init__(self, file_path): + '''This class contains part of the code from the main() for the SnakeI: Mach-O part.''' + self.file_path = os.path.abspath(file_path) + + def parseFatBinary(self): + '''Return Fat Binary object.''' + return lief.MachO.parse(self.file_path) + + def process(self, args): + '''Executes the code for the SnakeI: Mach-O.''' + if not os.path.exists(self.file_path): # Check if file_path specified in the --path argument exists. + print(f'The file {self.file_path} does not exist.') + exit() + + global binaries # It must be global, becuase after the MachOProcessor object is destructed, the snake_instance would point to invalid memory ("binary" is dependant on "binaries"). + global snake_instance # Must be global for further processors classes. + + binaries = self.parseFatBinary() + + if binaries == None: + exit() # Exit if not + + snake_instance = SnakeVI(binaries, self.file_path) # Initialize the latest Snake class + + if args.file_type: # Print binary file type + print(f'File type: {snake_instance.getFileType()}') + + if args.header_flags: # Print binary header flags + header_flag_list = snake_instance.getHeaderFlags() + print("Header flags:", " ".join(header_flag.name for header_flag in header_flag_list)) + + if args.endian: # Print binary endianess + print(f'Endianess: {snake_instance.getEndianess()}') + + if args.header: # Print binary header + print(snake_instance.getBinaryHeader()) + + if args.load_commands: # Print binary load commands + load_commands_list = snake_instance.getLoadCommands() + print("Load Commands:", " ".join(load_command.command.name for load_command in load_commands_list)) + + if args.segments: # Print binary segments in human friendly form + for segment in snake_instance.getSegments(): + print(segment) + + if args.sections: # Print binary sections in human friendly form + for section in snake_instance.getSections(): + print(section) + + if args.symbols: # Print symbols + for symbol in snake_instance.getSymbols(): + print(f"0x{symbol.value:016X} {symbol.name}") + + if args.imported_symbols: + snake_instance.printImportedSymbols() + + if args.chained_fixups: # Print Chained Fixups information + print(snake_instance.getChainedFixups()) + + if args.exports_trie: # Print Exports Trie information + print(snake_instance.getExportTrie()) + + if args.uuid: # Print UUID + print(f'UUID: {snake_instance.getUUID()}') + + if args.main: # Print entry point and stack size + snake_instance.printMain() + + if args.encryption_info is not None: # Print encryption info and save encrypted data if path is specified + snake_instance.printEncryptionInfo(args.encryption_info) + + if args.strings_section: # Print strings from __cstring section + print('Strings from __cstring section:') + print('-------------------------------') + for string in (snake_instance.getStringSection()): + print(string) + + if args.all_strings: # Print strings from all sections. + print(snake_instance.findAllStringsInBinary()) + + if args.save_strings: # Parse all sections, detect strings and save them to a file + extracted_strings = snake_instance.findAllStringsInBinary() + with open(args.save_strings, 'a') as f: + for s in extracted_strings: + f.write(s) + + if args.info: # Print all info about the binary + print('\n<=== HEADER ===>') + print(snake_instance.getBinaryHeader()) + print('\n<=== LOAD COMMANDS ===>') + for lcd in snake_instance.getLoadCommands(): + print(lcd) + print("="*50) + print('\n<=== SEGMENTS ===>') + for segment in snake_instance.getSegments(): + print(segment) + print('\n<=== SECTIONS ===>') + for section in snake_instance.getSections(): + print(section) + print('\n<=== SYMBOLS ===>') + for symbol in snake_instance.getSymbols(): + print(f"{(symbol.name).ljust(32)} {hex(symbol.value)}") + print('\n<=== STRINGS ===>') + print('Strings from __cstring section:') + print('-------------------------------') + for string in (snake_instance.getStringSection()): + print(string) + if snake_instance.binary.has_encryption_info: + print('\n<=== ENCRYPTION INFO ===>') + snake_instance.printEncryptionInfo() + print('\n<=== UUID ===>') + print(f'{snake_instance.getUUID()}') + print('\n<=== ENDIANESS ===>') + print(snake_instance.getEndianess()) + print('\n<=== ENTRYPOINT ===>') + snake_instance.printMain() + +class SnakeI: + def __init__(self, binaries, file_path): + ''' + When initiated, the program parses a Universal binary (binaries parameter) and extracts the ARM64 Mach-O. + If the file is not in a universal format but is a valid ARM64 Mach-O, it is taken as a binary parameter during initialization. + ''' + self.binary = self.parseFatBinary(binaries) + self.file_path = file_path + self.load_commands = self.getLoadCommands() + self.endianess = self.getEndianess() + self.fat_offset = self.binary.fat_offset # For various calculations, if ARM64 Mach-O extracted from Universal Binary + self.prot_map = { + 0: '---', + 1: 'r--', + 2: '-w-', + 3: 'rw-', + 4: '--x', + 5: 'r-x', + 6: '-wx', + 7: 'rwx' + } + self.segment_flags_map = { + 0x1: 'SG_HIGHVM', + 0x2: 'SG_FVMLIB', + 0x4: 'SG_NORELOC', + 0x8: 'SG_PROTECTED_VERSION_1', + 0x10: 'SG_READ_ONLY', + } + + def mapProtection(self, numeric_protection): + '''Maps numeric protection to its string representation.''' + return self.prot_map.get(numeric_protection, 'Unknown') + + def getSegmentFlags(self, flags): + '''Maps numeric segment flags to its string representation.''' + return self.segment_flags_map.get(flags, '') + #return " ".join(activated_flags) + + def parseFatBinary(self, binaries): + ''' + Parse Mach-O file, whether compiled for multiple architectures or just for a single one. + It returns the ARM64 binary if it exists. + If not, it exits the program. + ''' + for binary in binaries: + if binary.header.cpu_type == lief.MachO.CPU_TYPES.ARM64: + arm64_bin = binary + if arm64_bin == None: + print('The specified Mach-O file is not in ARM64 architecture.') + exit() + return arm64_bin + + def getFileType(self): + '''Extract and return the file type from a binary object's header.''' + return self.binary.header.file_type.name + + def getHeaderFlags(self): + '''Return binary header flags.''' + return self.binary.header.flags_list + + def getEndianess(self): + '''Check the endianness of a binary based on the system and binary's magic number.''' + magic = self.binary.header.magic.name + endianness = sys.byteorder + if endianness == 'little' and (magic == 'MAGIC_64' or magic == 'MAGIC' or magic == 'FAT_MAGIC'): + return 'little' + else: + return 'big' + + def getBinaryHeader(self): + '''https://lief-project.github.io/doc/stable/api/python/macho.html#header''' + return self.binary.header + + def getLoadCommands(self): + '''https://lief-project.github.io/doc/stable/api/python/macho.html#loadcommand''' + return self.binary.commands + + def getSegments(self): + '''Extract segmenents from binary and return a human readable string: https://lief-project.github.io/doc/stable/api/python/macho.html#lief.MachO.SegmentCommand''' + segment_info = [] + for segment in self.binary.segments: + name = segment.name + va_start = '0x' + format(segment.virtual_address, '016x') + va_end = '0x' + format(int(va_start, 16) + segment.virtual_size, '016x') + file_start = hex(segment.file_size + self.fat_offset) + file_end = hex(int(file_start, 16) + segment.file_size) + init_prot = self.mapProtection(segment.init_protection) + max_prot = self.mapProtection(segment.max_protection) + flags = self.getSegmentFlags(segment.flags) + if flags != '': + segment_info.append(f'{name.ljust(16)}{init_prot}/{max_prot.ljust(8)} VM: {va_start}-{va_end.ljust(24)} FILE: {file_start}-{file_end} ({flags})') + else: + segment_info.append(f'{name.ljust(16)}{init_prot}/{max_prot.ljust(8)} VM: {va_start}-{va_end.ljust(24)} FILE: {file_start}-{file_end}') + return segment_info + + def calcSectionRange(self, section): + ''' + The function calculates a section's start and end offset by adding the FAT slide in case of fat binary. + + Arg section is iterator object from the self.binary.sections (for section in self.binary.sections) + Return the start and end offset of the section. + ''' + start = section.offset + self.fat_offset + end = section.size + section.offset + self.fat_offset + return start, end + + def getSectionRange(self, segment_name, section_name): + ''' + Return section start and end file offset. + If there is no such section return False, False. + ''' + for section in self.binary.sections: + if segment_name == section.segment_name: + if section_name == section.fullname: + section_offset_start, section_offset_end = self.calcSectionRange(section) + return section_offset_start, section_offset_end + return False, False + + def getSections(self): + '''Extract sections from binary and return in human readable format: https://lief-project.github.io/doc/stable/api/python/macho.html#lief.MachO.Section''' + sections_info = [] + sections_info.append("SEGMENT".ljust(14) + "SECTION".ljust(20) + "TYPE".ljust(28) + "VIRTUAL MEMORY".ljust(32) + "FILE".ljust(26) + "FLAGS".ljust(40)) + sections_info.append(len(sections_info[0])*"=") + for section in self.binary.sections: + segment_name = section.segment_name + section_name = section.fullname + section_type = section.type.name + section_va_start = hex(section.virtual_address) + section_va_end = hex(section.virtual_address + section.offset) + section_size_start, section_size_end = self.calcSectionRange(section) + section_size_start = hex(section_size_start) + section_size_end = hex(section_size_end) + section_flags_list = section.flags_list + flags_strings = [flag.name for flag in section_flags_list] + flags = " ".join(flags_strings) + sections_info.append((f'{segment_name.ljust(14)}{section_name.ljust(20)}{section_type.ljust(28)}{section_va_start}-{section_va_end.ljust(20)}{section_size_start}-{section_size_end}\t\t({flags})')) + return sections_info + + def getSymbols(self): + '''Get all symbols from the binary (LC_SYMTAB, Chained Fixups, Exports Trie): https://lief-project.github.io/doc/stable/api/python/macho.html#symbol''' + return self.binary.symbols + + def getChainedFixups(self): + '''Return Chained Fixups information: https://lief-project.github.io/doc/latest/api/python/macho.html#chained-binding-info''' + return self.binary.dyld_chained_fixups + + def getExportTrie(self): + '''Return Export Trie information: https://lief-project.github.io/doc/latest/api/python/macho.html#dyldexportstrie-command''' + try: + return self.binary.dyld_exports_trie.show_export_trie() + except: + return "NO EXPORT TRIE" + + def getUUID(self): + '''Return UUID as string and in UUID format: https://lief-project.github.io/doc/stable/api/python/macho.html#uuidcommand''' + for cmd in self.binary.commands: + if isinstance(cmd, lief.MachO.UUIDCommand): + uuid_bytes = cmd.uuid + break + uuid_string = str(uuid.UUID(bytes=bytes(uuid_bytes))) + return uuid_string + + def getMain(self): + '''Determine the entry point of an executable.''' + return self.binary.main_command + + def printMain(self): + '''Prints entry point and stack size if exists.''' + entry_point = self.getMain() + if entry_point: + print(f'Entry point: {hex(self.getMain().entrypoint)}') + print(f'Stack size: {hex(self.getMain().stack_size)}') + else: + print(f"{self.file_path} has no entry point.") + + def getStringSection(self): + '''Return strings from the __cstring (string table).''' + extracted_strings = set() + for section in self.binary.sections: + if section.type == lief.MachO.SECTION_TYPES.CSTRING_LITERALS: + strings_bytes = section.content.tobytes() + strings = strings_bytes.decode('utf-8', errors='ignore') # Adjust the encoding as per your requirements + extracted_strings.update(strings.split('\x00')) + return extracted_strings + + def findAllStringsInBinary(self): + '''Check every binary section to find strings.''' + extracted_strings = "" + byte_set = set() + for section in self.binary.sections: + byte_set.update(section.content.tobytes().split(b'\x00')) + for byte_item in byte_set: + try: + decoded_string = byte_item.decode('utf-8') + extracted_strings += decoded_string + "\n" + except UnicodeDecodeError: + pass + return extracted_strings + + def getEncryptionInfo(self): + '''Return information regardles to LC_ENCRYPTION_INFO(_64).''' + if self.binary.has_encryption_info: + crypt_id = self.binary.encryption_info.crypt_id + crypt_offset = self.binary.encryption_info.crypt_offset + crypt_size = self.binary.encryption_info.crypt_size + return crypt_id, crypt_offset, crypt_size + else: + return None + + def printEncryptionInfo(self, save_path=''): + ''' + Pretty prints Encryption Info data if it exists. + If save_path argument is specified, save the encrypted data there. + If the cryptid is 0, the data is unencrypted. + ''' + encryption_info = self.getEncryptionInfo() + if encryption_info: + crypt_id, crypt_offset, crypt_size = encryption_info + print(f"cryptid: {crypt_id}") + print(f"cryptoffset: {hex(crypt_offset)}") + print(f"cryptsize: {hex(crypt_size)}") + if save_path: # args.encryption_info + self.saveEcryptedData(save_path.strip()) + else: + print(f"{os.path.basename(self.file_path)} binary does not have encryption info.") + + def extractBytesAtOffset(self, offset, size): + '''Extract bytes at a given offset and of a specified size in a binary file''' + # Open the binary file in binary mode + with open(self.file_path, "rb") as file: + # Check if the specified offset and size are within bounds + file_size = os.path.getsize(self.file_path) + #offset += self.fat_offset # Add the fat_offset in case of the Fat Binary (ARM binary data is most of the time after x86_64 binary data) + #print(hex(offset) + hex(size)) + if offset + size > file_size: + raise ValueError("Offset and size exceed the binary file's length.") + # Seek to the offset considering the fat_offset + file.seek(offset) + # Read the specified size of bytes + extracted_bytes = file.read(size) + return extracted_bytes + + def saveEcryptedData(self,output_path): + '''Method for saving encrypted data sector to specified file.''' + _, cryptoff, cryptsize = self.getEncryptionInfo() + self.saveBytesToFile(self.extractBytesAtOffset(cryptoff + self.fat_offset, cryptsize), output_path) + + def extractSection(self, segment_name, section_name): + ''' + As argument takes segment name (e.g. "__PRELINK_INFO") and section name that is a part of the segment (e.g. '__text'). + Return data (bytes) stored in a given section. + If section was not found, return False. + ''' + section_offset_start, section_offset_end = self.getSectionRange(segment_name, section_name) + if section_offset_start and section_offset_end: + size = section_offset_end - section_offset_start + extracted_bytes = self.extractBytesAtOffset(section_offset_start, size) + return extracted_bytes + return False + + def dumpSection(self, segment_name, section_name, filename): + ''' + Dump '__SEGMENT,__section' to a given file. + Reutrn False if the section does not exist. + ''' + extracted_bytes = self.extractSection(segment_name, section_name) + if extracted_bytes: + self.saveBytesToFile(extracted_bytes, filename) + return True + return False + +### --- II. CODE SIGNING --- ### +class CodeSigningProcessor: + def __init__(self): + '''This class contains part of the code from the main() for the SnakeII: Code Signing.''' + pass + + def process(self, args): + if args.verify_signature: # Verify if Code Signature match the binary content () + if snake_instance.isSigValid(snake_instance.file_path): + print("Valid Code Signature (matches the content)") + else: + print("Invalid Code Signature (does not match the content)") + + if args.cd_info: # Print Code Signature information + print(snake_instance.getCodeSignature(snake_instance.file_path).decode('utf-8')) + + if args.cd_requirements: # Print Requirements. + print(snake_instance.getCodeSignatureRequirements(snake_instance.file_path).decode('utf-8')) + + if args.entitlements: # Print Entitlements. + print(snake_instance.getEntitlementsFromCodeSignature(snake_instance.file_path, args.entitlements)) + + if args.extract_cms: # Extract the CMS Signature and save it to a given file. + cms_signature = snake_instance.extractCMS() + snake_instance.saveBytesToFile(cms_signature, args.extract_cms) + + if args.extract_certificates: # Extract Certificates and save them to a given file. + snake_instance.extractCertificatesFromCodeSignature(args.extract_certificates) + + if args.remove_sig: # Save a new file on a disk with the removed signature: + snake_instance.removeCodeSignature(args.remove_sig) + + if args.sign_binary: # Sign the given binary using specified identity: + snake_instance.signBinary(args.sign_binary) + +class SnakeII(SnakeI): + def __init__(self, binaries, file_path): + super().__init__(binaries, file_path) + self.magic_bytes = (0xFADE0B01).to_bytes(4, byteorder='big') # CMS Signature Blob magic bytes, as Code Signature as a whole is in network byte order(big endian). + + def isSigValid(self, file_path): + '''Checks if the Code Signature is valid (if the contents of the binary have been modified.)''' + result = subprocess.run(["codesign", "-v", file_path], capture_output=True) + if result.stderr == b'': + return True + else: + return False + + def getCodeSignature(self, file_path): + '''Returns information about the Code Signature.''' + result = subprocess.run(["codesign", "-d", "-vvvvvv", file_path], capture_output=True) + return result.stderr + + def getCodeSignatureRequirements(self, file_path): + '''Returns information about the Code Signature Requirements.''' + result = subprocess.run(["codesign", "-d", "-r", "-", file_path], capture_output=True) + return result.stdout + + def getEntitlementsFromCodeSignature(self, file_path, format=None): + '''Returns information about the Entitlements for Code Signature.''' + if format == 'human' or format == None: + result = subprocess.run(["codesign", "-d", "--entitlements", "-", file_path], capture_output=True) + return result.stdout.decode('utf-8') + elif format == 'xml': + result = subprocess.run(["codesign", "-d", "--entitlements", "-", "--xml", file_path], capture_output=True) + elif format == 'der': + result = subprocess.run(["codesign", "-d", "--entitlements", "-", "--der", file_path], capture_output=True) + return result.stdout + + def extractCMS(self): + '''Find the offset of magic bytes in a binary using LIEF.''' + cs = self.binary.code_signature + cs_content = bytes(cs.content) + offset = cs_content.find(self.magic_bytes) + cms_len_in_bytes = cs_content[offset + 4:offset + 8] + cms_len_in_int = int.from_bytes(cms_len_in_bytes, byteorder='big') + cms_signature = cs_content[offset + 8:offset + 8 + cms_len_in_int] + return cms_signature + + def saveBytesToFile(self, data, filename): + '''Save bytes to a file.''' + with open(filename, 'wb') as file: + file.write(data) + + def extractCertificatesFromCodeSignature(self, cert_name): + '''Extracts certificates from the CMS Signature and saves them to a file with _0, _1, _2 indexes at the end of the file names.''' + subprocess.run(["codesign", "-d", f"--extract-certificates={cert_name}_", self.file_path], capture_output=True) + + def removeCodeSignature(self, new_name): + '''Save new file on a disk with removed signature.''' + self.binary.remove_signature() + self.binary.write(new_name) + + def signBinary(self, security_identity=None): + '''Sign binary using pseudo identity (adhoc) or specified identity.''' + if security_identity == 'adhoc' or security_identity == None: + result = subprocess.run(["codesign", "-s", "-", "-f", self.file_path], capture_output=True) + return result.stdout.decode('utf-8') + else: + try: + result = subprocess.run(["codesign", "-s", security_identity, "-f", self.file_path], capture_output=True) + except Exception as e: + print(f"An error occurred during Code Signing using {security_identity}\n {e}") + +### --- III. CHECKSEC --- ### +class ChecksecProcessor: + def __init__(self): + '''This class contains part of the code from the main() for the SnakeIII: Checksec.''' + pass + + def process(self, args): + if args.has_pie: # Check if PIE is set in the header flags + print("PIE: " + str(snake_instance.hasPIE())) + + if args.has_arc: # Check if ARC is in use + print("ARC: " + str(snake_instance.hasARC())) + + if args.is_stripped: # Check if binary is stripped + print("STRIPPED: " + str(snake_instance.isStripped())) + + if args.has_canary: # Check if binary has stack canary + print("CANARY: " + str(snake_instance.hasCanary())) + + if args.has_nx_stack: # Check if binary has non executable stack + print("NX STACK: " + str(snake_instance.hasNXstack())) + + if args.has_nx_heap: # Check if binary has non executable heap + print("NX HEAP: " + str(snake_instance.hasNXheap())) + + if args.has_xn: # Check if binary is protected by eXecute Never functionality + print(f"eXecute Never: {str(snake_instance.hasXN())}") + + if args.is_notarized: # Check if the application is notarized and can pass the Gatekeeper verification + print("NOTARIZED: " + str(snake_instance.isNotarized(snake_instance.file_path))) + + if args.is_encrypted: # Check if the application has encrypted data + print("ENCRYPTED: " + str(snake_instance.isEncrypted())) + + if args.is_restricted: # Check if the application has encrypted data + print("RESTRICTED: " + str(snake_instance.isRestricted(snake_instance.file_path))) + + if args.is_hr: # Check if Hardened Runtime is in use + print("HARDENED: " + str(snake_instance.hasHardenedRuntimeFlag(snake_instance.file_path))) + + if args.is_as: # Check if App Sandbox is in use + print("APP SANDBOX: " + str(snake_instance.hasAppSandbox(snake_instance.file_path))) + + if args.is_fort: # Check if binary is fortified + fortified_symbols = snake_instance.getForifiedSymbols() + print("FORTIFIED: " + str(snake_instance.isFortified(fortified_symbols))) + + if args.has_rpath: # Check if binary has @rpaths + print("RPATH: " + str(snake_instance.hasRpath())) + + if args.has_lv: # Check if binary is protected against Dylib Hijacking + print("LIBRARY VALIDATION: " + str(snake_instance.checkDylibHijackingProtections(snake_instance.file_path))) + + if args.checksec: # Run all checks from above and present it in a table + print("<==== CHECKSEC ======") + print("PIE: ".ljust(16) + str(snake_instance.hasPIE())) + print("ARC: ".ljust(16) + str(snake_instance.hasARC())) + print("STRIPPED: ".ljust(16) + str(snake_instance.isStripped())) + print("CANARY: ".ljust(16) + str(snake_instance.hasCanary())) + print("NX STACK: ".ljust(16) + str(snake_instance.hasNXstack())) + print("NX HEAP: ".ljust(16) + str(snake_instance.hasNXheap())) + print("XN:".ljust(16) + str(snake_instance.hasXN())) + print("NOTARIZED: ".ljust(16) + str(snake_instance.isNotarized(snake_instance.file_path))) + print("ENCRYPTED: ".ljust(16) + str(snake_instance.isEncrypted())) + print("RESTRICTED: ".ljust(16) + str(snake_instance.isRestricted(snake_instance.file_path))) + print("HARDENED: ".ljust(16) + str(snake_instance.hasHardenedRuntimeFlag(snake_instance.file_path))) + print("APP SANDBOX: ".ljust(16) + str(snake_instance.hasAppSandbox(snake_instance.file_path))) + fortified_symbols = snake_instance.getForifiedSymbols() + print("FORTIFIED: ".ljust(16) + str(snake_instance.isFortified(fortified_symbols))) + print("RPATH: ".ljust(16) + str(snake_instance.hasRpath())) + print("LV: ".ljust(16) + str(snake_instance.checkDylibHijackingProtections(snake_instance.file_path))) + print("=====================>") + +class SnakeIII(SnakeII): + def __init__(self, binaries, file_path): + super().__init__(binaries, file_path) + + def hasPIE(self): + '''Check if MH_PIE (0x00200000) is set in the header flags.''' + return self.binary.is_pie + + def hasARC(self): + '''Check if the _objc_release symbol is imported.''' + for symbol in self.binary.symbols: + if symbol.name.lower().strip() == '_objc_release': + return True + return False + + def isStripped(self): + '''Check if binary is stripped.''' + filter_symbols = ['radr://5614542', '__mh_execute_header'] + + for symbol in self.binary.symbols: + symbol_type = symbol.type + symbol_name = symbol.name.lower().strip() + + is_symbol_stripped = (symbol_type & 0xe0 > 0) or (symbol_type in [0x0e, 0x1e, 0x0f]) + is_filtered = symbol_name not in filter_symbols + + if is_symbol_stripped and is_filtered: + return False + return True + + def hasCanary(self): + '''Check whether in the binary there are symbols: ___stack_chk_fail and ___stack_chk_guard.''' + canary_symbols = ['___stack_chk_fail', '___stack_chk_guard'] + for symbol in self.binary.symbols: + if symbol.name.lower().strip() in canary_symbols: + return True + return False + + def hasNXstack(self): + '''Check if MH_ALLOW_STACK_EXECUTION (0x00020000 ) is not set in the header flags.''' + return not bool(self.binary.header.flags & lief.MachO.HEADER_FLAGS.ALLOW_STACK_EXECUTION.value) + + def hasNXheap(self): + '''Check if MH_NO_HEAP_EXECUTION (0x01000000 ) is set in the header flags.''' + return bool(self.binary.header.flags & lief.MachO.HEADER_FLAGS.NO_HEAP_EXECUTION.value) + + def isXNos(): + '''Check if the OS is running on the ARM architecture.''' + system_info = os.uname() + if "arm" in system_info.machine.lower(): + return True + return False + + def checkXNmap(): + '''If XN is ON, you will not be able to map memory page that has W&X at the same time, so to check it, you can create such page.''' + try: + mmap.mmap(-1,4096, prot=mmap.PROT_READ | mmap.PROT_WRITE | mmap.PROT_EXEC) + except mmap.error as e: + #print(f"Failed to create W&X memory map - eXecute Never is supported on this machine. \n {str(e)}") + return True + return False + + def convertXMLEntitlementsToDict(self, entitlements_xml): + '''Takes the Entitlements in XML format from getEntitlementsFromCodeSignature() method and convert them to a dictionary.''' + return plistlib.loads(entitlements_xml) + + def convertDictEntitlementsToJson(self,entitlements_dict): + '''Takes the Entitlements in dictionary format from convertXMLEntitlementsToDict() method and convert them to a JSON with indent 4.''' + return json.dumps(entitlements_dict, indent=4) + + def checkIfEntitlementIsUsed(self, entitlement_name, entitlement_value, file_path): + '''Check if the given entitlement exists and has the specified value.''' + try: + entitlements_xml = self.getEntitlementsFromCodeSignature(file_path, 'xml') + if entitlements_xml == b'': # Return False if there are no entitlements + return False + entitlements_dict = self.convertXMLEntitlementsToDict(entitlements_xml) + # Convert the entire parsed data to lowercase for case-insensitive comparison + parsed_data = {key.lower(): value for key, value in entitlements_dict.items()} + # Convert entitlement name and value to lowercase for case-insensitive and type-insensitive comparison + entitlement_name_lower = entitlement_name.lower() + entitlement_value_lower = str(entitlement_value).lower() + + if entitlement_name_lower in parsed_data and str(parsed_data[entitlement_name_lower]).lower() == entitlement_value_lower: + return True + else: + return False + except json.JSONDecodeError as e: + # Handle JSON decoding error if any + print(f"Error in checkIfEntitlementIsUsed: {e}") + return False + + def hasAllowJITentitlement(self, file_path): + '''Checks if the binary has missing com.apple.security.cs.allow-jit entitlement that allows the app to create writable and executable memory using the MAP_JIT flag.''' + if self.checkIfEntitlementIsUsed('com.apple.security.cs.allow-jit', 'true', file_path): + print(f"[INFO -> XN]: {os.path.basename(file_path)} contains allow-jit entitlement.") + return True + return False + + def checkIfCompiledForOtherThanARM(self): + '''Iterates over FatBinary and check if there are other architectures than ARM.''' + XN_types = [lief.MachO.CPU_TYPES.ARM64, lief.MachO.CPU_TYPES.ARM] + for binary in binaries: + if binary.header.cpu_type not in XN_types: + print(f"[INFO -> XN]: {os.path.basename(file_path)} is compiled for other CPUs than ARM or ARM64.") + return True + return False + + def hasXN(self): + '''Check if binary allows W&X via com.apple.security.cs.allow-jit entitlement or is compiled for other CPU types than these which supports eXecuteNever feature of ARM.''' + if self.hasAllowJITentitlement(self.file_path) or self.checkIfCompiledForOtherThanARM(): + return False + return True + + def isNotarized(self, file_path): + '''Verifies if the application is notarized and can pass the Gatekeeper verification.''' + result = subprocess.run(["spctl", "-a", file_path], capture_output=True) + if result.stderr == b'': + return True + else: + #print(f"[INFO -> NOTARIZATION]: {result.stderr.decode().rstrip()}") + return False + + def isEncrypted(self): + '''If the cryptid has a non-zero value, some parts of the binary are encrypted.''' + if self.binary.has_encryption_info: + if self.binary.encryption_info.crypt_id == 1: + return True + return False + + def hasRestrictSegment(self): + '''Check if binary contains __RESTRICT segment. Return True if it does.''' + for segment in self.binary.segments: + if segment.name.lower().strip() == "__restrict": + return True + return False + + def hasRestrictFlag(self, file_path): + '''Check if Code Signature flag CS_RESTRICT 0x800(restrict) is set for the given binary''' + if b'restrict' in self.getCodeSignature(file_path): + return True + return False + + def isRestricted(self, file_path): + '''Check if binary has __RESTRICT segment or CS_RESTRICT flag set.''' + if self.hasRestrictSegment() or self.hasRestrictFlag(file_path): + return True + return False + + def hasHardenedRuntimeFlag(self, file_path): + '''Check if Hardened Runtime flag is set for the given binary.''' + if b'runtime' in self.getCodeSignature(file_path): + return True + return False + + def hasAppSandbox(self, file_path): + '''Check if App Sandbox is in use (com.apple.security.app-sandbox entitlement is set).''' + if self.checkIfEntitlementIsUsed('com.apple.security.app-sandbox', 'true', file_path): + return True + return False + + def getForifiedSymbols(self): + '''Check for symbol names that contain _chk suffix and filter out stack canary symbols. Function returns a list of all safe symbols.''' + symbol_fiter = ['___stack_chk_fail', '___stack_chk_guard'] + fortified_symbols = [] + for symbol in self.binary.symbols: + symbol_name = symbol.name.lower().strip() + if ('_chk' in symbol_name) and (symbol_name not in symbol_fiter): + fortified_symbols.append(symbol_name) + return fortified_symbols + + def isFortified(self, fortified_symbols): + '''Check if there are any fortified symbols in the give fortified_symbols list.''' + if len(fortified_symbols) > 0: + return True + return False + + def hasRpath(self): + return self.binary.has_rpath + +### --- IV. DYLIBS --- ### +class DylibsProcessor: + def __init__(self): + '''This class contains part of the code from the main() for the SnakeIV: Dylibs.''' + pass + + def process(self, args): + if args.dylibs: # Shared dylibs with unresolved paths + snake_instance.printDylibs() + + if args.rpaths: # All resolved paths from LC_RPATHs + snake_instance.printRpathsResolved() + + if args.rpaths_u: # All inresolved paths from LC_RPATHs + snake_instance.printRpathsUnresolved() + + if args.dylibs_paths: # Resolved dylib loading paths in order they are searched for + snake_instance.printResolvedDylibPaths() + + if args.dylibs_paths_u: # Unresolved dylib loading paths (same as --dylibs, but without version info) + snake_instance.printUnresolvedDylibPaths() + + if args.broken_relative_paths: # Relative paths + snake_instance.printBrokenRelativePaths() + + if args.dylibtree: # Dylibtree + args_dylibtree = args.dylibtree.split(',') + dylibtree = snake_instance.getDylibTree(args_dylibtree[0], args_dylibtree[1],args_dylibtree[2]) + snake_instance.printTreeFromTreelib(dylibtree) + + if args.dylib_id: # Path from Dylib ID Load Command + print(snake_instance.getPathFromDylibID()) + + if args.reexport_paths: # All reexported libraries paths + print(*snake_instance.getReExportPaths(), sep="\n") + + if args.hijack_sec: # Check Dylib Hijacking protection on binary + print("DYLIB HIJACKIG PROTECTION: " + str(snake_instance.checkDylibHijackingProtections(snake_instance.file_path))) + + if args.dylib_hijacking: # Direct & Indirect Dylib Hijacking check + if args.dylib_hijacking == 'default': + args.dylib_hijacking = None + all_results = snake_instance.dylibHijackingScanner(args.dylib_hijacking) + snake_instance.parseDylibHijackingScannerResults(all_results) + + if args.dylib_hijacking_a: # Show only possible vectors + if args.dylib_hijacking_a == 'default': + args.dylib_hijacking_a = None + all_results = snake_instance.dylibHijackingScanner(args.dylib_hijacking_a) + dh_check = snake_instance.isVulnDylibHijacking(all_results) + if dh_check: + print(dh_check) + + if args.prepare_dylib is not None: # Compile rogue dylib + snake_instance.prepareRogueDylib(args.prepare_dylib) + +class SnakeIV(SnakeIII): + def __init__(self, binaries, file_path): + ''' + When initiated, it run series of commands to extract: + - all load commands + - dylib loading commands + - dylib ID (if exists) + - rpaths (resolved) + - absolute paths (@executable_path|@loader_path|@rpath resolved) + Sets default Dyld Shared Cache location + ''' + super().__init__(binaries, file_path) + self.dylib_load_commands_names = { + 'LAZY_LOAD_DYLIB', + 'LOAD_DYLIB', + 'LOAD_UPWARD_DYLIB', + 'LOAD_WEAK_DYLIB', + 'PREBOUND_DYLIB', + 'REEXPORT_DYLIB', + } + self.dylib_id_path = self.getPathFromDylibID() # Get Dylib ID for @loader_path resolving + self.dylib_loading_commands, self.dylib_loading_commands_names = self.getDylibLoadCommands() # 1. Get dylib specific load commands + self.rpath_list = self.resolveRunPathLoadCommands() # 2. Get LC_RPATH list + self.absolute_paths = self.resolveDylibPaths() # 3. Get all dylib absolute paths dictionary {dylib_name[dylib_paths]} + self.dyld_share_cache_path = '/System/Volumes/Preboot/Cryptexes/OS/System/Library/dyld/dyld_shared_cache_arm64e' + + def getSharedLibraries(self, only_names=True): + ''' + Return array of shared libraries used by the binary. + When the only_names is set to False it aslo prints compatibility and current version of each library. + ''' + dylibs = [] + for library in self.binary.libraries: + if only_names: + dylibs.append(library.name) + else: + formatted_compat_version = ".".join(map(str, library.compatibility_version)) + formatted_current_version = ".".join(map(str, library.current_version)) + dylibs.append(f"{library.name} (compatibility version: {formatted_compat_version}, current version: {formatted_current_version})") + return dylibs + + def getDylibLoadCommands(self): + '''Return a list of load commands that load dylibs.''' + dylib_loading_commands = [] + dylib_loading_commands_names = [] + + for cmd in self.load_commands: + cmd_name = cmd.command.name + if cmd_name in self.dylib_load_commands_names: + dylib_loading_commands.append(cmd) + dylib_loading_commands_names.append(cmd_name) + + return dylib_loading_commands, dylib_loading_commands_names + + def getUnresolvedRunPathLoadCommandsPaths(self): + ''' + Return a list of unresolved paths (like @executable_path/Frameworks) from LC_RPATH load commands. Example return: + ['/usr/lib/swift', '@executable_path/Frameworks', '@loader_path/Frameworks'] + ''' + return [cmd.path for cmd in self.load_commands if cmd.command.name == 'RPATH'] + + def resolveRunPathLoadCommands(self): + ''' + Return a list of resolved (absolute) paths from LC_RPATH. Example return: + ['/usr/lib/swift', '/Applications/Suunto.app/WrappedBundle/Frameworks', '/Applications/Suunto.app/WrappedBundle/Frameworks'] + ''' + executable_path = os.path.dirname(self.file_path) + if self.dylib_id_path: + loader_path = self.dylib_id_path + else: + loader_path = executable_path + + unresolved_LC_RPATHS = self.getUnresolvedRunPathLoadCommandsPaths() + LC_RPATHS = [] + for path in unresolved_LC_RPATHS: + if path.startswith('@executable_path'): + path = path.replace('@executable_path',executable_path) + LC_RPATHS.append(path) + elif path.startswith('@loader_path'): + path = path.replace('@loader_path',loader_path) + LC_RPATHS.append(path) + else: + LC_RPATHS.append(path) + return LC_RPATHS + + def extractPathFromDylibLoadCommandStruct(self, dylib_load_command): + '''Extracts the string path from a dylib load command structure.''' + cmd_data = bytes(dylib_load_command.data) + offset_data = cmd_data[8:] + offset = int.from_bytes(offset_data[:4], byteorder=self.endianess) + string_data = cmd_data[offset:] + null_index = string_data.find(0) + path_bytes = string_data[:null_index] + path_string = path_bytes.decode('utf-8') + return path_string + + def resolveRunPathPaths(self, path): + ''' + Return ordered list of resolved @rpaths for the given dylib path. + Example return for self.rpath_list = ['/1/', '/2/'] and dylib path = @rpath/test.dylib + [ '/1/test.dylib', '/2/test.dylib'] + ''' + resolved_rpaths = [] + for rpath in self.rpath_list: + resolved_rpaths.append(path.replace('@rpath',rpath)) + return resolved_rpaths + + def resolveDylibPaths(self): + ''' + Return a dictionary of dylib_name : dylib_absolute_paths + Paths are absolute (with resolved @rpath, @executable_path, @loader_path) + ''' + executable_path = os.path.dirname(self.file_path) + if self.dylib_id_path: + loader_path = self.dylib_id_path + else: + loader_path = executable_path + absolute_paths = {} + + for dylib_load_command in self.dylib_loading_commands: + path = self.extractPathFromDylibLoadCommandStruct(dylib_load_command) + name = os.path.basename(path) + + if name not in absolute_paths: + absolute_paths[name] = [] + + if path.startswith('@executable_path'): + path = path.replace('@executable_path', executable_path) + absolute_paths[name].append(path) + + elif path.startswith('@rpath'): + paths = self.resolveRunPathPaths(path) + absolute_paths[name].extend(paths) + + elif path.startswith('@loader_path'): + path = path.replace('@loader_path', loader_path) + absolute_paths[name].append(path) + + else: + absolute_paths[name].append(path) + + return absolute_paths + + def checkBrokenRelativeDylibSource(self): + ''' + Check for bad dylib source. + When Dylib is relative, but does not use @executable_path | @loader_path | @rpath. + For example: mylib.dylib instead of @executable_path/mylib.dylib + ''' + broken_relative_dylibs = [] + for _, paths in self.absolute_paths.items(): # Iterate dylibs:paths dictionary + for path in paths: + if not path.startswith('/'): + broken_relative_dylibs.append(path) + + return broken_relative_dylibs + + def checkIfPathExists(self, path): + '''Check if specified path exists on the filesystem.''' + return os.path.exists(path) + + def checkIfPathExistsInDyldSharedCache(self, path, extracted_dyld_share_cache_directory_path): + '''Return if the path exists in the DSC - you must first extract it.''' + path = os.path.abspath(extracted_dyld_share_cache_directory_path) + "/" + path + return self.checkIfPathExists(path) + + def runDyldSharedCacheExtractor(self, dyld_share_cache_path, extracted_output_path): + '''Run dyld-shared-cache-extractor command.''' + command = ['dyld-shared-cache-extractor', dyld_share_cache_path, extracted_output_path] + subprocess.run(command, check=True) + + def getDylibTree(self, dyld_share_cache_path=None, extracted_output_path=None, is_extracted=0): + ''' + A function that inspects the dynamic dependencies of a Mach-O binary recursively (like recursive otool -L). + You must use absolute path in --path if you are using --dylibtree from extracted Dyld Shared Cache. + ''' + if dyld_share_cache_path in [None, '']: + dyld_share_cache_path = self.dyld_share_cache_path + + if extracted_output_path in [None, '']: + extracted_output_path = 'extracted_dyld_share_cache/' + extracted_output_path = os.path.abspath(extracted_output_path) # Convert to absolute path + + if is_extracted == '0': + self.runDyldSharedCacheExtractor(dyld_share_cache_path, extracted_output_path) + + dylibtree = treelib.Tree() + path_to_process = [self.file_path] + already_checked_paths = [] + not_existing_paths = [] # It could be the already_checked_paths for optimization, but for code clarity it stay. + node_id = 0 + dylibtree.create_node(self.file_path, node_id) + + while path_to_process: + current_path = path_to_process.pop() + + if (current_path not in path_to_process) and (current_path not in already_checked_paths) and (current_path not in not_existing_paths): + fat_binary = lief.MachO.parse(current_path) + dylib_snake_instance = SnakeIV(fat_binary, current_path) + + if current_path.startswith(extracted_output_path): + current_path = current_path.removeprefix(extracted_output_path) + + for _, dylib_paths in dylib_snake_instance.absolute_paths.items(): + for path in dylib_paths: # All dylibs for current binary (current_path from existing_path_to_process) + absolute_path = os.path.abspath(path) + node_id += 1 + filtered_nodes = list(dylibtree.filter_nodes(lambda node: node.tag == current_path)) + nid_of_first_occurance_of_dylib_in_dylibtree = filtered_nodes[0].identifier + # If path exist on the filesystem or DSC, add as a leaf to tree + ## current_path(root) -> absolute_path(leaf) + if absolute_path not in path_to_process: + if dylib_snake_instance.checkIfPathExists(absolute_path): + path_to_process.append(absolute_path) # Add this path to process recursively in while loop + dylibtree.create_node(absolute_path, node_id, parent=nid_of_first_occurance_of_dylib_in_dylibtree) # Add a path as a leaf + elif dylib_snake_instance.checkIfPathExistsInDyldSharedCache(path, extracted_output_path): + dsc_path = extracted_output_path + path + path_to_process.append(dsc_path) + dylibtree.create_node(absolute_path, node_id, data='\033[94mDSC\033[0m', parent=nid_of_first_occurance_of_dylib_in_dylibtree) # Add a path as a leaf + else: + not_existing_paths.append(absolute_path) + dylibtree.create_node(absolute_path, node_id, data='\033[91mWARNING - not existing path\033[0m', parent=nid_of_first_occurance_of_dylib_in_dylibtree) + + # If the node path (current_path) was checked, it should not be unwind again. + already_checked_paths.append(current_path) + already_checked_paths.append(extracted_output_path + current_path) + + return dylibtree + + def getDylibID(self): + ''' + Return a LC_ID_DYLIB Load Command if exists. + Dyld additionally check if the FILE TYPE == MH_DYLIB. + I intentionally omit this step to always extract ID. + ''' + for cmd in self.load_commands: + if cmd.command.name == 'ID_DYLIB': + return cmd + return None + + def getPathFromDylibID(self): + '''Return a path stored inside the Dylib ID Load Command.''' + dylib_id_lc = self.getDylibID() + if dylib_id_lc: + return self.extractPathFromDylibLoadCommandStruct(dylib_id_lc) + return None + + def printTreeFromTreelib(self, tree): + ''' + Helper function for printing the dylibtree. + It will only work with this structure because the root id is equal to 0 (tree.get_node(0)), which is not always true. + I had to write this to make pretty printing with data work because, by default, tree limb does not support printing with data. + Data is needed to show warnings if any library is missing on the filesystem and to inform if the library was from Dyld Share Cachce. + ''' + def recursivePrint(node, prefix="", last=True): + data_str = f": {node.data}" if node.data else "" + print(f"{prefix}{'`-- ' if last else '|-- '}{node.tag}{data_str}") + + children = tree.children(node.identifier) + count = len(children) + + for i, child in enumerate(children): + is_last = i == count - 1 + child_prefix = f"{prefix}{' ' if last else '| '}" + recursivePrint(child, child_prefix, is_last) + + root = tree.get_node(0) + recursivePrint(root) + + def printDylibs(self): + dylibs = self.getSharedLibraries(only_names=False) + if dylibs: + print(f"{self.file_path} depends on libraries:") + for d in dylibs: + print(f"\t{d}") + else: + print(f"{self.file_path} does not depend on any libraries.") + + def printRpathsResolved(self): + '''Print all paths that @rpath can be resolved to.''' + print(*self.rpath_list, sep="\n") + + def printRpathsUnresolved(self): + print(*self.getUnresolvedRunPathLoadCommandsPaths(), sep="\n") + + def printResolvedDylibPaths(self): + '''Prints all resolved (absolute) dylib loading commands paths.''' + for _, dylib_paths in self.absolute_paths.items(): + print(*dylib_paths, sep='\n') + + def printUnresolvedDylibPaths(self): + '''Prints all unresolved (with @rpath|@executable_path|@loader_path) dylib loading commands paths.''' + for dylib_load_command in self.dylib_loading_commands: + print(self.extractPathFromDylibLoadCommandStruct(dylib_load_command)) + + def printBrokenRelativePaths(self): + '''Print 'broken' relative paths from the binary (cases where the dylib source is specified for an executable directory without @executable_path)''' + for broken_path in self.checkBrokenRelativeDylibSource(): + print(broken_path) + + def getMissingPaths(self): + '''Return two unique lists of missing and existing paths.''' + missing_paths = [] + existing_paths = [] + for _, paths in self.absolute_paths.items(): + for path in paths: + if os.path.exists(path): + existing_paths.append(path) + break # Stop checking further paths for this dylib + else: + missing_paths.append(path) + unique_missing = list(set(missing_paths)) + unique_existing = list(set(existing_paths)) + return unique_missing, unique_existing + + def checkWriteAccessMissing(self, paths): + ''' + Check write access for the given paths. + In case the directory does not exists, traverse back till directory that exists and check write access there. + Return a list of writeable directories. + ''' + write_accessible_paths = [] + for path in paths: + current_path = path + if os.access(current_path, os.W_OK): + write_accessible_paths.append(path) + continue + while current_path: + current_path = os.path.dirname(current_path) + if not os.path.exists(current_path): + continue + if os.access(current_path, os.W_OK): + write_accessible_paths.append(path) + break + else: + break + + return write_accessible_paths + + def checkWriteAccessExisting(self, paths): + '''Return a list of write-accessible paths.''' + write_accessible_paths = [] + for path in paths: + if os.access(path, os.W_OK): + write_accessible_paths.append(path) + + return write_accessible_paths + + def hasLibraryValidationFlag(self, file_path): + '''Check Library validation flag for given binary.''' + if b'library-validation' in self.getCodeSignature(file_path): + return True + return False + + def hasDisableLibraryValidationEntitlement(self, file_path): + ''' + Checks if the binary has com.apple.security.cs.disable-library-validation or com.apple.private.security.clear-library-validation entitlement set. + They allows loading dylibs without requiring code signing. + ''' + if self.checkIfEntitlementIsUsed('com.apple.security.cs.disable-library-validation', 'true', file_path) or self.checkIfEntitlementIsUsed('com.apple.private.security.clear-library-validation','true', file_path): + return True + return False + + def getDyldSharedCacheDylibsPaths(self, dsc_path): + ''' + Parse Dyld Shared Cache using ipsw to extract dylib paths. + Ref: https://blacktop.github.io/ipsw/docs/guides/dyld/ + ''' + if dsc_path == None: + dsc_path = self.dyld_share_cache_path + + command = f"ipsw dyld info {dsc_path} -l -j >> /tmp/dyld_shared_cache_temp_1234.json" + subprocess.run(command, shell=True, check=True) + + with open('/tmp/dyld_shared_cache_temp_1234.json', 'r') as file: + data = json.load(file) + os.remove('/tmp/dyld_shared_cache_temp_1234.json') + + # jq -r '.dylibs[].name' dsc.json + paths = [dylib['name'] for dylib in data.get('dylibs', [])] + return paths + + def printDyldSharedCacheDylibsPaths(self, dsc_path): + '''Print Dyld paths from Dyld Shared Cache.''' + if dsc_path == None: + dsc_path = self.dyld_share_cache_path + + paths = self.getDyldSharedCacheDylibsPaths(dsc_path) + for path in paths: + print(path) + + def checkDylibHijackingProtections(self, file_path): + ''' + Check protections against dylib hijacking. + Return True if protected (has library validation ON). + ''' + + # Check if 'com.apple.security.cs.disable-library-validation' or 'com.apple.private.security.clear-library-validation' entitlements are present and set to true - INSECURE. + has_insecure_entitlement = self.hasDisableLibraryValidationEntitlement(file_path) + + # Check if Library validation or Hardened runtime is active - SECURE + is_hardened_runtime_active = self.hasHardenedRuntimeFlag(file_path) + is_library_validation_active = self.hasLibraryValidationFlag(file_path) + + if has_insecure_entitlement: # Entitlements disables protections + return False + elif is_hardened_runtime_active or is_library_validation_active: # If there are no entitlements and HR or LV exists, then protections is ON + return True + else: # If there are no insecure entitlements, but there are also no HR or LV, there are no protections + return False + + def dylibHijackingScanner(self, dyld_share_cache_path): + ''' + Direct and Indirect Dylib Hijacking Scanner - return dictionary of results for main binary and each dependancy. + Save JSON format to /tmp/dylib_hijacking_log.json. + Return results dictionary. + ''' + + if dyld_share_cache_path in [None, '']: + dyld_share_cache_path = self.dyld_share_cache_path + + dsc_paths = self.getDyldSharedCacheDylibsPaths(dyld_share_cache_path) + already_checked_paths = [] + all_results = {} + path_to_process = [self.file_path] + + while path_to_process: + current_path = path_to_process.pop() + + result = { + 'is_protected' : bool, + 'writeable_missing_paths' : [], + 'writeable_existing_paths' : [] + } + + if (current_path not in already_checked_paths) and (current_path not in dsc_paths): + fat_binary = lief.MachO.parse(current_path) + dylib_snake_instance = SnakeIV(fat_binary, current_path) + + missing_paths, existing_paths = dylib_snake_instance.getMissingPaths() + result['writeable_missing_paths'] = dylib_snake_instance.checkWriteAccessMissing(missing_paths) + result['writeable_existing_paths'] = dylib_snake_instance.checkWriteAccessExisting(existing_paths) + result['is_protected'] = dylib_snake_instance.checkDylibHijackingProtections(dylib_snake_instance.file_path) + + already_checked_paths.append(current_path) + path_to_process.extend(existing_paths) + all_results[current_path] = result + + json_file_path = '/tmp/dylib_hijacking_log.json' + with open(json_file_path, 'a') as json_file: + json.dump(all_results, json_file) + + return all_results + + def isVulnDylibHijacking(self, all_results): + ''' + Automatically decide if target is vulnerable to Dylib Hijacking. + Returns vulnerability info or None if protected. + ''' + root_binary = True + info = '' + + for current_path, result in all_results.items(): + + if root_binary and result['is_protected']: + return # Root binary is protected - not vuln + + if not result['is_protected']: + if result['writeable_existing_paths'] or result['writeable_missing_paths']: + if root_binary: + info += (f'\033[91mVULNERABLE ROOT BINARY\033[0m: {current_path}\n') + root_binary = False + else: + info += (f'\033[91mVULNERABLE DEPENDENCY\033[0m: {current_path}\n') + if result['writeable_existing_paths']: + info += (f"\033[91mWRITEABLE EXISTING PATHS\033[0m: {', '.join(map(str, result['writeable_existing_paths']))}\n") + if result['writeable_missing_paths']: + info += (f"\033[91mWRITEABLE MISSING PATHS\033[0m: {', '.join(map(str, result['writeable_missing_paths']))}\n") + + if info: + return info + else: + return + + def parseDylibHijackingScannerResults(self, all_results): + ''' + Print the dylibHijackingScanner results in a nice format. + ''' + first_iteration = True + + for current_path, result in all_results.items(): + if first_iteration: + if result['is_protected']: + print(f"\033[92mROOT BINARY PROTECTED\033[0m: {current_path}") + else: + print(f"\033[91mROOT BINARY NOT PROTECTED\033[0m: {current_path}") + first_iteration = False + else: + if result['is_protected']: + print(f"\033[92mPROTECTED\033[0m: {current_path}") + else: + print(f"\033[91mNOT PROTECTED\033[0m: {current_path}") + if result['writeable_existing_paths']: + print(f"\033[91mWRITEABLE EXISTING PATHS\033[0m: {', '.join(map(str, result['writeable_existing_paths']))}") + if result['writeable_missing_paths']: + print(f"\033[91mWRITEABLE MISSING PATHS\033[0m: {', '.join(map(str, result['writeable_missing_paths']))}") + print("-"*28) + + def getReExportLoadCommands(self): + ''' + Return a list of REEXPORT_DYLIB Load Commands if exists. + ''' + reexport_load_commands = [] + for cmd in self.load_commands: + if cmd.command.name == 'REEXPORT_DYLIB': + reexport_load_commands.append(cmd) + return reexport_load_commands + + def getReExportPaths(self): + '''Return paths stored inside the REEXPORT_DYLIB Load Commands.''' + reexport_load_commands = self.getReExportLoadCommands() + paths = [] + if reexport_load_commands: + for load_command in reexport_load_commands: + paths.append(self.extractPathFromDylibLoadCommandStruct(load_command)) + return paths + + def getImportedSymbols(self): + '''Return a dictionary of imported symbols and names of external libraries where they come from.''' + imported_symbols = {} + + for symbol in self.binary.imported_symbols: + binding_info = symbol.binding_info + + if binding_info: + dylib = binding_info.library + + if dylib: + imported_symbols[symbol.name] = dylib.name + + return imported_symbols + + def printImportedSymbols(self): + ''' + Parse getImportedSymbols dictionary in grepable form and print it. + Symbol names are grouped (sorted) by library. Example output: + symbol_name : library1 + symbol_name : library1 + symbol_name : library2 + symbol_name : library3 + ''' + imported_symbols = self.getImportedSymbols() + grouped_symbols = {} + + # Group symbols by unresolved library path + for symbol_name, unresolved_library_path in imported_symbols.items(): + if unresolved_library_path not in grouped_symbols: + grouped_symbols[unresolved_library_path] = [] + grouped_symbols[unresolved_library_path].append(symbol_name) + + # Print the grouped symbols + for unresolved_library_path, symbols in grouped_symbols.items(): + for symbol_name in symbols: + print(f'{symbol_name} : {unresolved_library_path}') + + def getImportedSymbolsFromTargetLib(self, external_library_name): + ''' + This function is like a `cat printImportedSymbols | grep external_library`. + Filter imported symbols in binary (--path binary) to only those from specified external library (--preapre_dylib external_library_name). + + https://lief-project.github.io/doc/stable/api/python/macho.html#binary + https://lief-project.github.io/doc/stable/api/python/macho.html#binding-info + https://lief-project.github.io/doc/stable/api/python/macho.html#dylibcommand + ''' + imported_symbols = self.getImportedSymbols() + grep_result = [] + for symbol_name, unresolved_library_path in imported_symbols.items(): + if external_library_name in unresolved_library_path: + grep_result.append(symbol_name) + + return grep_result + + def prepareRogueDylib(self, target_library_path=''): + ''' + Compile m.dylib which by default: + 1. Prints log about successful injection to stdout & stderr syslog. + 2. If the binary is SUID, sets RUID to EUID and prints user ID. + ''' + file_name_c = 'm.c' + source_code = SourceCodeManager.dylib_hijacking + output_filename = 'm.dylib' + flag_list = ['-dynamiclib'] + + if target_library_path: + imported_sybols = self.getImportedSymbolsFromTargetLib(target_library_path) + else: + imported_sybols = [] + + if imported_sybols: + for symbol in imported_sybols: + if symbol.startswith('_'): + symbol = symbol[1:] + function_to_add = f'\nvoid {symbol}(void){{}}' + source_code += function_to_add + + SourceCodeManager.clangCompilerWrapper(file_name_c, source_code, output_filename, flag_list) + +### --- V. DYLD --- ### +class DyldProcessor: + def __init__(self): + '''This class contains part of the code from the main() for the SnakeV: Dyld.''' + pass + + def process(self, args): + if args.is_built_for_sim: # Check if binary is build for a simulator + snake_instance.printIsBuiltForSimulator() + + if args.get_dyld_env: # Extract DYLD environment variables from the loader binary + snake_instance.printDyldEnv() + + if args.compiled_with_dyld_env: # Print Environment variables from the LC_DYLD_ENVIRONMENT + snake_instance.printDyldEnvLoadCommands() + + if args.has_interposing: # Print if binary has interposing sections + print("INTERPOSING: " + str(snake_instance.hasInterposing())) + + if args.interposing_symbols: # Print all replacement symbols from the __interpose section + snake_instance.printInterposingSymbols() + +class SnakeV(SnakeIV): + def __init__(self, binaries, file_path): + super().__init__(binaries, file_path) + self.platforms = { + 1: 'PLATFORM_MACOS', + 2: 'PLATFORM_IOS', + 3: 'PLATFORM_TVOS', + 4: 'PLATFORM_WATCHOS', + 5: 'PLATFORM_BRIDGEOS', + 6: 'PLATFORM_MACCATALYST', + 7: 'PLATFORM_IOSSIMULATOR', + 8: 'PLATFORM_TVOSSIMULATOR', + 9: 'PLATFORM_WATCHOSSIMULATOR', + 10: 'PLATFORM_DRIVERKIT' + } # https://github.com/Karmaz95/Snake_Apple/blob/main/IV.%20Dylibs/macos/loader.h#L1275 + + def isBuiltForSimulator(self): + ''' + Function for --is_built_for_sim flag. + https://lief-project.github.io/doc/stable/api/python/macho.html#lief.MachO.BuildVersion.PLATFORMS + Returns True if platform is in : + #define PLATFORM_IOSSIMULATOR 7 + #define PLATFORM_TVOSSIMULATOR 8 + #define PLATFORM_WATCHOSSIMULATOR 9. + ''' + simulator_platforms = [7,8,9] + platform_value = self.binary.build_version.platform.value + if platform_value in simulator_platforms: + return True, platform_value + elif platform_value > 10: + return None, platform_value + else: + return False, platform_value + + def printIsBuiltForSimulator(self): + ''' + Print text instead of True|False from the isBuiltForSimulator return. + Example outputs: + test platform is PLATFORM_IOSSIMULATOR -> built for simulator. + executable platform is PLATFORM_MACOS -> not built for simulator + ''' + name = os.path.basename(self.file_path) + platform_check, platform_value = self.isBuiltForSimulator() + if platform_check == True: + print(f'{name} platform is \033[94m{self.platforms[platform_value]}\033[0m\033[91m -> built for simulator\033[0m. ') + elif platform_check == None: + print(f'{name} is build for UNKNOWN platform -> \033[94m{platform_value}\033[0m') + else: + print(f'{name} platform is \033[94m{self.platforms[platform_value]}\033[0m\033[92m -> not built for simulator\033[0m') + + def getDyldEnv(self): + '''Return a list of DYLD environment variables from the binary.''' + dyld_env = [] + strings_from_CSTRING = self.getStringSection() + for s in strings_from_CSTRING: + if s.startswith('DYLD_') and '/' not in s: + # Exclude DYLD_$ paths (that starts and ends with DYLD_) + if s.endswith('DYLD_'): + continue + # Remove spaces and all after the first occurrence of space + s = s.split(' ')[0].strip() + if s not in dyld_env: + dyld_env.append(s) + return dyld_env + + def printDyldEnv(self): + '''Print DYLD environment variables from the binary.''' + dyld_env = self.getDyldEnv() + if dyld_env: + print(*dyld_env, sep='\n') + else: + print("No DYLD environment variables found.") + + def enumDyldEnvLoadCommands(self): + '''Check if binary has DYLD_ENVIRONMENT load commands.''' + all_dyld_env = [] + + for cmd in self.load_commands: + if cmd.command.name == 'DYLD_ENVIRONMENT': + all_dyld_env.append(cmd) + + return all_dyld_env + + def printDyldEnvLoadCommands(self): + '''Print DYLD_ENVIRONMENT load commands.''' + all_dyld_env = self.enumDyldEnvLoadCommands() + + if all_dyld_env: + for cmd in all_dyld_env: + print(cmd.value) + + def hasInterposing(self): + '''Check if binary has interposing sections.''' + for section in self.binary.sections: + if section.name == "__interpose": + return True + return False + + def getInterposingSymbolsAddresses(self): + '''Get replacement symbols addresses from the __interpose section.''' + interposing_symbols_addresses = [] + bit_mask = 0xffffffff + + if self.hasInterposing(): + for section in self.binary.sections: + if section.name == "__interpose": + for i in range(0, len(section.content), 16): + address = int.from_bytes(section.content[i:i+8], byteorder=self.endianess) + interposing_symbols_addresses.append(address) + + # Remove binary virtual address base to get the symbol offset only ['0x3f54'] instead of ['0x10000000003f54'] + i = 0 + for addr in interposing_symbols_addresses: + interposing_symbols_addresses[i] = addr & bit_mask + i+=1 + + return interposing_symbols_addresses + + def getInterposingSymbols(self): + '''Get all replacement symbols from the __interpose section.''' + interposing_symbols_addresses = self.getInterposingSymbolsAddresses() + interposing_symbols_names = [] + + if interposing_symbols_addresses: + for symbol in self.getSymbols(): + if symbol.value in interposing_symbols_addresses: + interposing_symbols_names.append(symbol.name) + + return interposing_symbols_names, interposing_symbols_addresses + + def printInterposingSymbols(self): + '''Print all replacement symbols from the __interpose section.''' + symbol_names, symbol_addrs = self.getInterposingSymbols() + for symbol_name, symbol_addrs in zip(symbol_names, symbol_addrs): + print(f"{(symbol_name).ljust(32)} {hex(symbol_addrs)}") + +### --- VI. AMFI --- ### +class AMFIProcessor: + def __init__(self): + '''This class contains part of the code from the main() for the SnakeVI: AMFI.''' + pass + + def process(self, args): + if args.dump_prelink_info is not None: # nargs="?", const='PRELINK_info.txt' # Dump '__PRELINK_INFO,__info' to a given file (default: 'PRELINK_info.txt') + snake_instance.dumpPrelink_info(args.dump_prelink_info) + + if args.dump_prelink_text is not None: # Dump '__PRELINK_TEXT,__text' to a given file (default: 'PRELINK_text.txt') + snake_instance.dumpPrelink_text(args.dump_prelink_text) + + if args.amfi: + pass + +class SnakeVI(SnakeV): + def __init__(self, binaries, file_path): + super().__init__(binaries, file_path) + + def dumpPrelink_info(self, filename): + ''' Dump '__PRELINK_INFO,__info' to a given file (default: 'PRELINK_info.txt') ''' + segment_name = '__PRELINK_INFO' + section_name = '__info' + self.dumpSection(segment_name, section_name, filename) + + def dumpPrelink_text(self, filename): + ''' Dump '__PRELINK_TEXT,__text' to a given file (default: 'PRELINK_text.txt') ''' + segment_name = '__PRELINK_TEXT' + section_name = '__text' + self.dumpSection(segment_name, section_name, filename) + + +### --- ARGUMENT PARSER --- ### +class ArgumentParser: + def __init__(self): + '''Class for parsing arguments from the command line. I decided to remove it from main() for additional readability and easier code maintenance in the VScode''' + self.parser = argparse.ArgumentParser(description="Mach-O files parser for binary analysis") + self.addGeneralArgs() + self.addMachOArgs() + self.addCodeSignArgs() + self.addChecksecArgs() + self.addDylibsArgs() + self.addDyldArgs() + self.addAMFIArgs() + + def addGeneralArgs(self): + self.parser.add_argument('-p', '--path', required=True, help="Path to the Mach-O file") + + def addMachOArgs(self): + macho_group = self.parser.add_argument_group('MACH-O ARGS') + macho_group.add_argument('--file_type', action='store_true', help="Print binary file type") + macho_group.add_argument('--header_flags', action='store_true', help="Print binary header flags") + macho_group.add_argument('--endian', action='store_true', help="Print binary endianess") + macho_group.add_argument('--header', action='store_true', help="Print binary header") + macho_group.add_argument('--load_commands', action='store_true', help="Print binary load commands names") + macho_group.add_argument('--segments', action='store_true', help="Print binary segments in human-friendly form") + macho_group.add_argument('--sections', action='store_true', help="Print binary sections in human-friendly form") + macho_group.add_argument('--symbols', action='store_true', help="Print all binary symbols") + macho_group.add_argument('--imported_symbols', action='store_true', help="Print symbols imported from external libraries") + macho_group.add_argument('--chained_fixups', action='store_true', help="Print Chained Fixups information") + macho_group.add_argument('--exports_trie', action='store_true', help="Print Export Trie information") + macho_group.add_argument('--uuid', action='store_true', help="Print UUID") + macho_group.add_argument('--main', action='store_true', help="Print entry point and stack size") + macho_group.add_argument('--encryption_info', nargs='?',const='', help="Print encryption info if any. Optionally specify an output path to dump the encrypted data (if cryptid=0, data will be in plain text)", metavar="(optional) save_path.bytes") + macho_group.add_argument('--strings_section', action='store_true', help="Print strings from __cstring section") + macho_group.add_argument('--all_strings', action='store_true', help="Print strings from all sections") + macho_group.add_argument('--save_strings', help="Parse all sections, detect strings, and save them to a file", metavar='all_strings.txt') + macho_group.add_argument('--info', action='store_true', default=False, help="Print header, load commands, segments, sections, symbols, and strings") + + def addCodeSignArgs(self): + codesign_group = self.parser.add_argument_group('CODE SIGNING ARGS') + codesign_group.add_argument('--verify_signature', action='store_true', default=False, help="Code Signature verification (if the contents of the binary have been modified)") + codesign_group.add_argument('--cd_info', action='store_true', default=False, help="Print Code Signature information") + codesign_group.add_argument('--cd_requirements', action='store_true', default=False, help="Print Code Signature Requirements") + codesign_group.add_argument('--entitlements', help="Print Entitlements in a human-readable, XML, or DER format (default: human)", nargs='?', const='human', metavar='human|xml|var') + codesign_group.add_argument('--extract_cms', help="Extract CMS Signature from the Code Signature and save it to a given file", metavar='cms_signature.der') + codesign_group.add_argument('--extract_certificates', help="Extract Certificates and save them to a given file. To each filename will be added an index at the end: _0 for signing, _1 for intermediate, and _2 for root CA certificate", metavar='certificate_name') + codesign_group.add_argument('--remove_sig', help="Save the new file on a disk with removed signature", metavar='unsigned_binary') + codesign_group.add_argument('--sign_binary', help="Sign binary using specified identity - use : 'security find-identity -v -p codesigning' to get the identity (default: adhoc)", nargs='?', const='adhoc', metavar='adhoc|identity') + + def addChecksecArgs(self): + checksec_group = self.parser.add_argument_group('CHECKSEC ARGS') + checksec_group.add_argument('--has_pie', action='store_true', default=False, help="Check if Position-Independent Executable (PIE) is set") + checksec_group.add_argument('--has_arc', action='store_true', default=False, help="Check if Automatic Reference Counting (ARC) is in use (can be false positive)") + checksec_group.add_argument('--is_stripped', action='store_true', default=False, help="Check if binary is stripped") + checksec_group.add_argument('--has_canary', action='store_true', default=False, help="Check if Stack Canary is in use (can be false positive)") + checksec_group.add_argument('--has_nx_stack', action='store_true', default=False, help="Check if stack is non-executable (NX stack)") + checksec_group.add_argument('--has_nx_heap', action='store_true', default=False, help="Check if heap is non-executable (NX heap)") + checksec_group.add_argument('--has_xn', action='store_true', default=False, help="Check if binary is protected by eXecute Never (XN) ARM protection") + checksec_group.add_argument('--is_notarized', action='store_true', default=False, help="Check if the application is notarized and can pass the Gatekeeper verification") + checksec_group.add_argument('--is_encrypted', action='store_true', default=False, help="Check if the application is encrypted (has LC_ENCRYPTION_INFO(_64) and cryptid set to 1)") + checksec_group.add_argument('--is_restricted', action='store_true', default=False, help="Check if binary has __RESTRICT segment or CS_RESTRICT flag set") + checksec_group.add_argument('--is_hr', action='store_true', default=False, help="Check if the Hardened Runtime is in use") + checksec_group.add_argument('--is_as', action='store_true', default=False, help="Check if the App Sandbox is in use") + checksec_group.add_argument('--is_fort', action='store_true', default=False, help="Check if the binary is fortified") + checksec_group.add_argument('--has_rpath', action='store_true', default=False, help="Check if the binary utilise any @rpath variables") + checksec_group.add_argument('--has_lv', action='store_true', default=False, help="Check if the binary has Library Validation (protection against Dylib Hijacking)") + checksec_group.add_argument('--checksec', action='store_true', default=False, help="Run all checksec module options on the binary") + + def addDylibsArgs(self): + dylibs_group = self.parser.add_argument_group('DYLIBS ARGS') + dylibs_group.add_argument('--dylibs', action='store_true', default=False, help="Print shared libraries used by specified binary with compatibility and the current version (loading paths unresolved, like @rpath/example.dylib)") + dylibs_group.add_argument('--rpaths', action='store_true', default=False, help="Print all paths (resolved) that @rpath can be resolved to") + dylibs_group.add_argument('--rpaths_u', action='store_true', default=False, help="Print all paths (unresolved) that @rpath can be resolved to") + dylibs_group.add_argument('--dylibs_paths', action='store_true', default=False, help="Print absolute dylib loading paths (resolved @rpath|@executable_path|@loader_path) in order they are searched for") + dylibs_group.add_argument('--dylibs_paths_u', action='store_true', default=False, help="Print unresolved dylib loading paths.") + dylibs_group.add_argument('--broken_relative_paths', action='store_true', default=False, help="Print 'broken' relative paths from the binary (cases where the dylib source is specified for an executable directory without @executable_path)") + dylibs_group.add_argument('--dylibtree', metavar=('cache_path,output_path,is_extracted'), nargs = '?', const=",,0", help='Print the dynamic dependencies of a Mach-O binary recursively. You can specify the Dyld Shared Cache path in the first argument, the output directory as the 2nd argument, and if you have already extracted DSC in the 3rd argument (0 or 1). The output_path will be used as a base for dylibtree. For example, to not extract DSC, use: --dylibs ",,1", or to extract from default to default use just --dylibs or --dylibs ",,0" which will extract DSC to extracted_dyld_share_cache/ in the current directory') + dylibs_group.add_argument('--dylib_id', action='store_true', default=False, help="Print path from LC_ID_DYLIB") + dylibs_group.add_argument('--reexport_paths', action='store_true', default=False, help="Print paths from LC_REEXPORT_DLIB") + dylibs_group.add_argument('--hijack_sec', action='store_true', default=False, help="Check if binary is protected against Dylib Hijacking") + dylibs_group.add_argument('--dylib_hijacking', metavar='(optional) cache_path' ,nargs="?", const="default", help="Check for possible Direct and Indirect Dylib Hijacking loading paths. The output is printed to console and saved in JSON format to /tmp/dylib_hijacking_log.json(append mode). Optionally, specify the path to the Dyld Shared Cache") + dylibs_group.add_argument('--dylib_hijacking_a', metavar='cache_path' ,nargs="?", const="default", help="Like --dylib_hijacking, but shows only possible vectors (without protected binaries)") + dylibs_group.add_argument('--prepare_dylib', metavar='(optional) target_dylib_name', nargs="?", const='', help="Compile rogue dylib. Optionally, specify target_dylib_path, it will search for the imported symbols from it in the dylib specified in the --path argument and automatically add it to the source code of the rogue lib. Example: --path lib1.dylib --prepare_dylib /path/to/lib2.dylib") + + def addDyldArgs(self): + dyld_group = self.parser.add_argument_group('DYLD ARGS') + dyld_group.add_argument('--is_built_for_sim', action='store_true', default=False, help="Check if binary is built for simulator platform.") + dyld_group.add_argument('--get_dyld_env', action='store_true', default=False, help="Extract Dyld environment variables from the loader binary.") + dyld_group.add_argument('--compiled_with_dyld_env', action='store_true', default=False, help="Check if binary was compiled with -dyld_env flag and print the environment variables and its values.") + dyld_group.add_argument('--has_interposing', action='store_true', default=False, help="Check if binary has interposing sections.") + dyld_group.add_argument('--interposing_symbols', action='store_true', default=False, help="Print interposing symbols if any.") + + def addAMFIArgs(self): + dyld_group = self.parser.add_argument_group('AMFI ARGS') + dyld_group.add_argument('--dump_prelink_info', metavar='(optional) out_name', nargs="?", const='PRELINK_info.txt', help='Dump "__PRELINK_INFO,__info" to a given file (default: "PRELINK_info.txt")') + dyld_group.add_argument('--dump_prelink_text', metavar='(optional) out_name', nargs="?", const='PRELINK_text.txt', help='Dump "__PRELINK_TEXT,__text" to a given file (default: "PRELINK_text.txt")') + dyld_group.add_argument('--amfi', action='store_true', default=False, help="a") + + + + def parseArgs(self): + return self.parser.parse_args() + + def printAllArgs(self, args): + '''Just for debugging. This method is a utility designed to print all parsed arguments and their corresponding values.''' + for arg, value in vars(args).items(): + print(f"{arg}: {value}") + +### --- SOURCE CODE --- ### +class SourceCodeManager: + dylib_hijacking = r''' +// clang -dynamiclib m.c -o m.dylib //-o $PWD/TARGET_DYLIB +#include +#include +#include +#include + +__attribute__((constructor)) +void myconstructor(int argc, const char **argv) +{ + syslog(LOG_ERR, "[+] m.dylib injected in %s\n", argv[0]); + printf("[+] m.dylib injected in %s\n", argv[0]); + setuid(0); + system("id"); + //system("/bin/sh"); +} +''' + @staticmethod + def clangCompilerWrapper(file_name_c, source_code, output_filename, flag_list=None): + # Save the source code to a file + with open(file_name_c, "w") as source_file: + source_file.write(source_code) + + # Compile the source code using clang + clang_command = ["clang", file_name_c, "-o", output_filename, *flag_list] + subprocess.run(clang_command, check=True) + +if __name__ == "__main__": + arg_parser = ArgumentParser() + args = arg_parser.parseArgs() + + file_path = os.path.abspath(args.path) + + ### --- I. MACH-O --- ### + macho_processor = MachOProcessor(file_path) + macho_processor.process(args) + + ### --- II. CODE SIGNING --- ### + code_signing_processor = CodeSigningProcessor() + code_signing_processor.process(args) + + ### --- III. CHECKSEC --- ### + checksec_processor = ChecksecProcessor() + checksec_processor.process(args) + + ### --- IV. DYLIBS --- ### + dylibs_processor = DylibsProcessor() + dylibs_processor.process(args) + + ### --- V. DYLD --- ### + dyld_processor = DyldProcessor() + dyld_processor.process(args) + + ### --- VI. AMFI --- ### + amfi_processor = AMFIProcessor() + amfi_processor.process(args) \ No newline at end of file