[docs]defdecode_address(enc_address:int,code_length:int)->addr_t:""" Resolves an encoded address and returns the corresponding file offset. Args: enc_address (int): The encoded address to be resolved. code_length (int): The length of the bytecode file. Returns: int: The decoded address as an absolute file offset. """return((enc_address^~code_length)&0xFFFFFFFF)%code_length
# -----------------------------------------------------------------------------# Entry point decoding# -----------------------------------------------------------------------------defdecode_entry_point_v0(vm:"VM")->addr_t:a=vm.context.u32(addr=0x04)b01=(~a&0xFFFFFF8E)*-3+(~a|0xFFFFFF8E)b02=(a*2)^0xFFFFFF1Cprint((b01+b02)&0xFFFFFFFF)returnvm.context.addr((b01+b02)&0xFFFFFFFF,rel=False)defdecode_entry_point_v1(vm:"VM")->addr_t:a=vm.context.u32(addr=0x04)returnvm.context.addr((a^0x44)+((a<<1)&0x88),rel=False)# -----------------------------------------------------------------------------# public field types# -----------------------------------------------------------------------------le_u64=le+uint64le_u32=le+uint32le_s32=le+int32le_u16=le+uint16# -----------------------------------------------------------------------------# Memory Management# -----------------------------------------------------------------------------classVMVariable:#: the human readable type of this variabletype:str|None#: the value associated with this variablevalue:Anyname:str#: the position of this variable in memory (file offset)__address_:addr_tdef__init__(self,addr:addr_t,ty:str|None=None,value:Any=None)->None:self.__address_=addrself.value=valueself.type=tyself.name="_"@propertydefaddress(self)->addr_t:returnself.__address_def__str__(self)->str:returnself.name
[docs]classVMMemory:"""Internal memory manager for the VM. This class keeps track of objects that are allocated on the heap using malloc(..). """#: INternal map that stores all objects that should be#: accessible.objects:dict[ptr_t,Any]#: Memory variablesvariables:dict[addr_t,VMVariable]#: Base address for this memory managerbase_address:ptr_t# Current address for allocating objects_alloc_pos:ptr_t
[docs]defalloc[T](self,ty:Type[T],*args,**kwargs)->tuple[ptr_t,T]:"""Simulates memory allocation by instantiating an object of the given type. This function stores a reference to the created object in the internal object map and resturns the target address together with the created object. """addr=self._alloc_posobj=ty(*args,**kwargs)self.objects[addr]=objself._alloc_pos+=8return(addr,obj)
[docs]defmalloc(self,size:int)->tuple[ptr_t,bytearray]:"""Simulates memory allocation by creating a bytearray using the given size."""addr=self._alloc_posobj=bytearray(size)self.objects[addr]=objself._alloc_pos+=sizereturn(addr,obj)
[docs]defu32(self,addr:addr_t=-1)->int:"""Reads an unsigned 32bit integer. Reads the integer from the current program counter if address is -1. Args: addr (int, optional): the target address. Defaults to -1. Returns: int: the parsed int """returnself.get(le_u32,addr)
[docs]defi32(self,addr:addr_t=-1)->int:"""Reads a signed 32bit integer. Reads the integer from the current program counter if address is -1. Args: addr (int, optional): the target address. Defaults to -1. Returns: int: the parsed int """returnself.get(le_s32,addr)
[docs]defu64(self,addr:addr_t=-1)->int:"""Reads an unsigned 64bit integer. Reads the integer from the current program counter if address is -1. Args: addr (int, optional): the target address. Defaults to -1. Returns: int: the parsed int """returnself.get(le_u64,addr)
[docs]defdouble(self,addr:addr_t=-1)->float:"""Reads a 64bit floating point value. Reads the value from the current program counter if address is -1. Args: addr (int, optional): the target address. Defaults to -1. Returns: float: the parsed double """returnself.get(le+double,addr)
[docs]defu16(self,addr:addr_t=-1,decode=False)->int:"""Reads an unsigned 16bit integer. Reads the integer from the current program counter if address is -1. Args: addr (int, optional): the target address. Defaults to -1. Returns: int: the parsed int """returnself.get(le+uint16,addr)
[docs]defaddr(self,off:int,rel=True,decode=True)->addr_t:"""Reads an encoded address relative to the current addres (default) Args: off (int): relative offset (absolute if rel=False) rel (bool, optional): whether off is relative. Defaults to True. decode (bool, optional): decodes the address after parsing. Defaults to True. Returns: int: the parsed address """address=self.u32(offifnotrelelseself.pc+off)ifdecode:returndecode_address(address,self.vm_code_length)returnaddress
[docs]classVMState:"""Tracks the internal state of the VM and stores environment options"""#: whether to print decompiled or disassembled outputverbose:bool#: Output writer (may be null)writer:Any#: controls whether the VM should stop executionshould_exit:bool#: comment start charactercomment:str#: internal mapping of variables used by the Decompiler or disassembler_env:dict[str,Any]# --- special methods ---
def__getitem__(self,key):returnself._env[key]def__setitem__(self,key,value):self._env[key]=value# --- debugging support ---
[docs]defpsection(self,name:str,*comments)->None:"""Writes a line to the terminal. Args: name (str): the section name """line=f".{name}:"self.pline(line,*comments)
[docs]defpinsn(self,insn:str,args:str,*comments:str,indent:int=1)->None:"""Writes an instruction to the terminal. Args: name (str): the line to write """line=(" "*indent)+f"{insn:<8}{args}"self.pline(line,*comments)
[docs]defpline(self,line,*args)->None:"""Writes a line to the terminal. Args: name (str): the line to write """iflen(args)>0:args=[self.comment]+list(args)ifself.verbose:self.writer(" ".join([f"{line:40s}"]+list(args)))
# -----------------------------------------------------------------------------# VM# -----------------------------------------------------------------------------classVM:#: internal state and environmentstate:VMState#: code and code positioncontext:VMContext#: memorymem:VMMemorydef__init__(self,bytecode:bytes,opcode_decoder_fn:OpcodeDecoderFn,entry_point_decode_fn:EntryPointDecoderFn,address_decoder_fn:AddressDecoderFn=decode_address,hash_verifier_fn:HashVerifierFn=verify_fnv,pc:addr_t=-1,mem_base_addr:ptr_t=-1,verbose:bool=False,writer:Any=print,**env,)->None:self.mem=VMMemory(mem_base_addrifmem_base_addr>=0else0xDEAD00000000)self.context=VMContext(bytecode,pc)self.state=VMState(verbose,writer,**env)self._entry_point_decoder=entry_point_decode_fnself._address_decoder=address_decoder_fnself._opcode_decoder=opcode_decoder_fnself._hash_verifier=hash_verifier_fndefentry_point(self)->addr_t:"""Calculates the entry point for the current program Returns: int: the entry point address (file offset) """ifnotself._entry_point_decoder:raiseValueError(f"{self.__class__.__name__} can't resolve entry point!")returnself._entry_point_decoder(self)defcurrent_opcode(self)->int:"""Returns the decoded opcode for the current pc. Returns: int: the decoded opcode """ifnotself._opcode_decoder:raiseValueError(f"{self.__class__.__name__} does not support decoding opcodes!")returnself._opcode_decoder(self.context.u16())# return decode_opcode(self.context.u16()) & 0xFFFFdefverify_hash(self,addr:addr_t=-1)->bool:""" Verifies the integrity of a section of the VM's code by checking its hash value. (Used to select the next instruction address) Args: addr (addr_t, optional): The address in the bytecode to verify. Defaults to the current program counter (pc) if not provided. Returns: bool: True if the hash verification is successful, False otherwise. """ifnotself._hash_verifier:raiseNotImplementedError(f"{self.__class__.__name__} does not implement hash verification!")returnself._hash_verifier(addr,self)