mirror of
https://github.com/dobin/SuperMega
synced 2026-06-02 17:27:10 +00:00
127 lines
4.4 KiB
Python
127 lines
4.4 KiB
Python
import sys
|
|
import pefile
|
|
import pprint
|
|
from keystone import Ks, KS_ARCH_X86, KS_MODE_64
|
|
from capstone import Cs, CS_ARCH_X86, CS_MODE_64, CS_MODE_LITTLE_ENDIAN
|
|
import logging
|
|
|
|
from model.defs import *
|
|
|
|
logger = logging.getLogger("PEHelper")
|
|
|
|
|
|
# PEHelper
|
|
# Work directly on PE files. Not using superpe or other abstractions.
|
|
# Its mostly used for verification of what we were doing.
|
|
|
|
|
|
def extract_code_from_exe_file_ep(exe_file: FilePath, len: int) -> bytes:
|
|
pe = pefile.PE(exe_file)
|
|
section = get_code_section(pe)
|
|
data: bytes = section.get_data()
|
|
data = remove_trailing_null_bytes(data)
|
|
ep = pe.OPTIONAL_HEADER.AddressOfEntryPoint
|
|
ep_raw = get_physical_address_tmp(pe, ep)
|
|
data = data[ep_raw:ep_raw+len]
|
|
pe.close()
|
|
return data
|
|
|
|
|
|
def get_physical_address_tmp(pe, virtual_address):
|
|
for section in pe.sections:
|
|
if section.VirtualAddress <= virtual_address < section.VirtualAddress + section.Misc_VirtualSize:
|
|
virtual_offset = virtual_address - section.VirtualAddress
|
|
physical_address = section.PointerToRawData + virtual_offset
|
|
return physical_address
|
|
return None
|
|
|
|
|
|
def extract_code_from_exe_file(exe_file: FilePath) -> bytes:
|
|
pe = pefile.PE(exe_file)
|
|
section = get_code_section(pe)
|
|
data: bytes = section.get_data()
|
|
data = remove_trailing_null_bytes(data)
|
|
logger.debug("---[ Extract code section size: {} / {}".format(
|
|
len(data), section.Misc_VirtualSize))
|
|
pe.close()
|
|
return data
|
|
|
|
|
|
def write_code_section(exe_file: FilePath, new_data: bytes):
|
|
pe = pefile.PE(exe_file)
|
|
section = get_code_section(pe)
|
|
file_offset = section.PointerToRawData
|
|
with open(exe_file, 'r+b') as f:
|
|
f.seek(file_offset)
|
|
f.write(new_data)
|
|
pe.close()
|
|
|
|
|
|
def get_code_section(pe: pefile.PE) -> pefile.SectionStructure:
|
|
entrypoint = pe.OPTIONAL_HEADER.AddressOfEntryPoint
|
|
for sect in pe.sections:
|
|
if sect.Characteristics & pefile.SECTION_CHARACTERISTICS['IMAGE_SCN_MEM_EXECUTE']:
|
|
if entrypoint >= sect.VirtualAddress and entrypoint <= sect.VirtualAddress + sect.Misc_VirtualSize:
|
|
return sect
|
|
raise Exception("pehelper::get_code_section(): Code section not found")
|
|
|
|
|
|
# keystone/capstone stuff
|
|
cs = Cs(CS_ARCH_X86, CS_MODE_64 + CS_MODE_LITTLE_ENDIAN)
|
|
|
|
def assemble_lea(current_address: int, destination_address: int, reg: str) -> bytes:
|
|
#print("LEAH: 0x{:X} - 0x{:X} = 0x{:X}".format(
|
|
# current_address, destination_address, destination_address - current_address))
|
|
offset = destination_address - current_address
|
|
ks = Ks(KS_ARCH_X86, KS_MODE_64)
|
|
encoding, _ = ks.asm(f"lea {reg}, qword ptr ds:[{offset}]")
|
|
machine_code = bytes(encoding)
|
|
return machine_code
|
|
|
|
|
|
def assemble_relative_call(current_address: int, destination_address: int) -> bytes:
|
|
# Calculate the relative offset
|
|
# For a near jump, the instruction length is typically 5 bytes (E9 xx xx xx xx)
|
|
offset = destination_address - current_address
|
|
|
|
# Assemble the jump instruction using Keystone
|
|
ks = Ks(KS_ARCH_X86, KS_MODE_64)
|
|
encoding, _ = ks.asm(f"call qword ptr ds:[{offset}]")
|
|
machine_code = bytes(encoding)
|
|
|
|
# Disassemble the machine code using Capstone
|
|
#cs = Cs(CS_ARCH_X86, CS_MODE_64)
|
|
#disassembled = next(cs.disasm(machine_code, current_address))
|
|
#logger.info(f"Machine Code: {' '.join(f'{byte:02x}' for byte in machine_code)}")
|
|
#logger.info(f"Disassembled: {disassembled.mnemonic} {disassembled.op_str}")
|
|
return machine_code
|
|
|
|
|
|
def assemble_relative_jmp(current_address: int, destination_address: int) -> bytes:
|
|
offset = destination_address - current_address
|
|
ks = Ks(KS_ARCH_X86, KS_MODE_64)
|
|
encoding, _ = ks.asm(f"jmp {offset}")
|
|
machine_code = bytes(encoding)
|
|
return machine_code
|
|
|
|
|
|
def asm_disasm(asm_text, offset=0):
|
|
for instr in cs.disasm(asm_text, offset):
|
|
printInstr(instr)
|
|
|
|
def printInstr(instr, depth=0):
|
|
_bytes = [f'{x:02x}' for x in instr.bytes[:8]]
|
|
if len(instr.bytes) < 8:
|
|
_bytes.extend([' ',] * (8 - len(instr.bytes)))
|
|
instrBytes = ' '.join([f'{x}' for x in _bytes])
|
|
logger.info('\t' * 1 + f' [{instr.address:08x}]\t{instrBytes}' + '\t' * depth + f'{instr.mnemonic}\t{instr.op_str}')
|
|
|
|
|
|
## Utils
|
|
|
|
def remove_trailing_null_bytes(data: bytes) -> bytes:
|
|
for i in range(len(data) - 1, -1, -1):
|
|
if data[i] != b'\x00'[0]: # Check for a non-null byte
|
|
return data[:i + 1]
|
|
return b'' # If the entire sequence is null bytes
|