Source code for vtrace.platforms.base

"""
Tracer Platform Base
"""
# Copyright (C) 2007 Invisigoth - See LICENSE file for details
import os
import struct
import vtrace
import traceback
import platform

from Queue import Queue
from threading import Thread,currentThread,Lock

import envi
import envi.memory as e_mem
import envi.threads as e_threads
import envi.resolver as e_resolv

import vstruct.builder as vs_builder

[docs]class TracerBase(vtrace.Notifier): """ The basis for a tracer's internals. All platformFoo/archFoo functions are defaulted, and internal state is initialized. Additionally, a number of internal utilities are housed here. """ def __init__(self): """ The routine to initialize a tracer's initial internal state. This is used by the initial creation routines, AND on attaches/executes to re-fresh the state of the tracer. WARNING: This will erase all metadata/symbols (modes/notifiers are kept) """ vtrace.Notifier.__init__(self) self.pid = 0 # Attached pid (also used to know if attached) self.exited = False self.breakpoints = {} self.newbreaks = [] self.bpbyid = {} self.bpid = 0 self.curbp = None self.bplock = Lock() self.deferred = [] self.running = False self.runagain = False self.attached = False # A cache for memory maps and fd listings self.mapcache = None self.thread = None # our proxy thread... self.threadcache = None self.fds = None self.signal_ignores = [] self.localvars = {} # Set if we are RunForever until a thread exit... self._join_thread = None self._break_after_bp = True # Do we stop on the instruction *after* the bp? self.vsbuilder = vs_builder.VStructBuilder() self.psize = self.getPointerSize() # From the envi arch mod... # Track which libraries are parsed, and their # normame to full path mappings self.libloaded = {} # True if the library has been loaded already self.libpaths = {} # normname->filename and filename->normname lookup # Set up some globally expected metadata self.setMeta('PendingSignal', None) self.setMeta('SignalInfo', None) self.setMeta("IgnoredSignals",[]) self.setMeta("LibraryBases", {}) # name -> base address mappings for binaries self.setMeta("LibraryPaths", {}) # base -> path mappings for binaries self.setMeta("ThreadId", 0) # If you *can* have a thread id put it here plat = platform.system() rel = platform.release() self.setMeta("Platform", plat) self.setMeta("Release", rel) # Use this if we are *expecting* a break # which is caused by us (so we remove the # SIGBREAK from pending_signal self.setMeta("ShouldBreak", False)
[docs] def nextBpId(self): self.bplock.acquire() x = self.bpid self.bpid += 1 self.bplock.release() return x
def _justAttached(self, pid): # Used by the top level Trace after platform routines self.pid = pid self.attached = True self.breakpoints = {} self.bpbyid = {} self.setMeta("PendingSignal", None) self.setMeta("ExitCode", 0) self.exited = False
[docs] def getResolverForFile(self, filename): res = self.resbynorm.get(filename, None) if res: return res res = self.resbyfile.get(filename, None) if res: return res return None
[docs] def steploop(self): """ Continue stepi'ing in a loop until shouldRunAgain() returns false (like RunForever mode or something) """ if self.getMode("NonBlocking", False): e_threads.firethread(self.doStepLoop)() else: self.doStepLoop()
[docs] def doStepLoop(self): go = True while go: self.stepi() go = self.shouldRunAgain()
def _doRun(self): # Exists to avoid recursion from loop in doWait self.requireAttached() self.requireNotRunning() self.requireNotExited() fastbreak = False if self.curbp: fastbreak = self.curbp.fastbreak # If we are on a breakpoint, and it's a fastbreak # we don't want to fire a "continue" event. if not fastbreak: self.fireNotifiers(vtrace.NOTIFY_CONTINUE) # Step past a breakpoint if we are on one. self._checkForBreak() # Throw down and activate breakpoints... if not fastbreak: self._throwdownBreaks() self.running = True self.runagain = False self._syncRegs() # Must be basically last... self.platformContinue() self.setMeta("PendingSignal", None)
[docs] def wait(self): """ Wait for the trace target to have something happen... If the trace is in NonBlocking mode, this will fire a thread to wait for you and return control immediately. """ if self.getMode("NonBlocking"): e_threads.firethread(self._doWait)() else: self._doWait()
def _doWait(self): doit = True while doit: # A wrapper method for wait() and the wait thread to use self.setMeta('SignalInfo', None) self.setMeta('PendingSignal', None) event = self.platformWait() self.running = False self.platformProcessEvent(event) doit = self.shouldRunAgain() if doit: self._doRun() def _fireSignal(self, signo, siginfo=None): self.setMeta('PendingSignal', signo) self.setMeta('SignalInfo', siginfo) self.fireNotifiers(vtrace.NOTIFY_SIGNAL) def _fireExit(self, ecode): self.setMeta('ExitCode', ecode) self.fireNotifiers(vtrace.NOTIFY_EXIT) def _fireExitThread(self, threadid, ecode): self.setMeta('ExitThread', threadid) self.setMeta('ExitCode', ecode) self.fireNotifiers(vtrace.NOTIFY_EXIT_THREAD) def _activateBreak(self, bp): # NOTE: This is special cased by hardware debuggers etc... if bp.isEnabled(): try: bp.activate(self) except Exception, e: traceback.print_exc() print "WARNING: bpid %d activate failed (deferring): %s" % (bp.id, e) self.deferred.append(bp) def _throwdownBreaks(self): """ Run through the breakpoints and setup the ones that are enabled. NOTE: This should *not* get called when continuing from a fastbreak... """ # Resolve deferred breaks for bp in self.deferred: addr = bp.resolveAddress(self) if addr != None: self.deferred.remove(bp) self.breakpoints[addr] = bp for bp in self.breakpoints.values(): self._activateBreak(bp) def _syncRegs(self): """ Sync the reg-cache into the target process """ if self.regcache != None: for tid, ctx in self.regcache.items(): if ctx.isDirty(): self.platformSetRegCtx(tid, ctx) self.regcache = None def _cacheRegs(self, threadid): """ Make sure the reg-cache is populated """ if self.regcache == None: self.regcache = {} ret = self.regcache.get(threadid) if ret == None: ret = self.platformGetRegCtx(threadid) ret.setIsDirty(False) self.regcache[threadid] = ret return ret def _checkForBreak(self): """ Check to see if we've landed on a breakpoint, and if so deactivate and step us past it. WARNING: Unfortunatly, cause this is used immidiatly before a call to run/wait, we must block briefly even for the GUI """ # Steal a reference because the step should # clear curbp... bp = self.curbp if bp != None and bp.isEnabled(): if bp.active: bp.deactivate(self) orig = self.getMode("FastStep") self.setMode("FastStep", True) self.stepi() self.setMode("FastStep", orig) bp.activate(self) self.curbp = None
[docs] def shouldRunAgain(self): """ A unified place for the test as to weather this trace should be told to run again after reaching some stopping condition. """ if not self.attached: return False if self.exited: return False if self.getMode("RunForever"): return True if self.runagain: return True return False
def __repr__(self): run = "stopped" exe = "None" if self.isRunning(): run = "running" elif self.exited: run = "exited" exe = self.getMeta("ExeName") return "[%d]\t- %s <%s>" % (self.pid, exe, run)
[docs] def initMode(self, name, value, descr): """ Initialize a mode, this should ONLY be called during setup routines for the trace! It determines the available mode setings. """ self.modes[name] = bool(value) self.modedocs[name] = descr
[docs] def release(self): """ Do cleanup when we're done. This is mostly necissary because of the thread proxy holding a reference to this tracer... We need to let him die off and try to get garbage collected. """ if self.thread: self.thread.go = False
def _cleanupResources(self): self._tellThreadExit() def _tellThreadExit(self): if self.thread != None: self.thread.queue.put(None) self.thread.join(timeout=2) self.thread = None def __del__(self): if not self._released: print 'Warning! tracer del w/o release()!'
[docs] def fireTracerThread(self): # Fire the threadwrap proxy thread for this tracer # (if it hasnt been fired...) if self.thread == None: self.thread = TracerThread()
[docs] def fireNotifiers(self, event): """ Fire the registered notifiers for the NOTIFY_* event. """ if event == vtrace.NOTIFY_SIGNAL: signo = self.getCurrentSignal() if signo in self.getMeta("IgnoredSignals", []): if vtrace.verbose: print "Ignoring",signo self.runAgain() return alllist = self.getNotifiers(vtrace.NOTIFY_ALL) nlist = self.getNotifiers(event) trace = self # if the trace has a proxy it's notifiers # need that, cause we can't be pickled ;) if self.proxy: trace = self.proxy # First we notify ourself.... self.handleEvent(event, self) # The "NOTIFY_ALL" guys get priority for notifier in alllist: try: notifier.handleEvent(event,trace) except: print "WARNING: Notifier exception for",repr(notifier) traceback.print_exc() for notifier in nlist: try: notifier.handleEvent(event,trace) except: print "WARNING: Notifier exception for",repr(notifier) traceback.print_exc()
def _cleanupBreakpoints(self): ''' Cleanup all breakpoints (if the current bp is "fastbreak" this routine will not be called... ''' for bp in self.breakpoints.itervalues(): bp.deactivate(self) def _fireStep(self): if self.getMode('FastStep', False): return self.fireNotifiers(vtrace.NOTIFY_STEP) def _fireBreakpoint(self, bp): self.curbp = bp # A breakpoint should be inactive when fired # (even fastbreaks, we'll need to deactivate for stepi anyway) bp.deactivate(self) try: bp.notify(vtrace.NOTIFY_BREAK, self) except Exception, msg: traceback.print_exc() print "Breakpoint Exception 0x%.8x : %s" % (bp.address,msg) if not bp.fastbreak: self.fireNotifiers(vtrace.NOTIFY_BREAK) else: # fastbreak's are basically always "run again" self.runagain = True
[docs] def checkPageWatchpoints(self): """ Check if the given memory fault was part of a valid MapWatchpoint. """ faultaddr,faultperm = self.platformGetMemFault() #FIXME this is some AWESOME but intel specific nonsense if faultaddr == None: return False faultpage = faultaddr & 0xfffff000 wp = self.breakpoints.get(faultpage, None) if wp == None: return False self._fireBreakpoint(wp) return True
[docs] def checkWatchpoints(self): # Check for hardware watchpoints waddr = self.archCheckWatchpoints() if waddr != None: wp = self.breakpoints.get(waddr, None) self._fireBreakpoint(wp) return True
[docs] def checkBreakpoints(self): """ This is mostly for systems (like linux) where you can't tell the difference between some SIGSTOP/SIGBREAK conditions and an actual breakpoint instruction. This method will return true if either the breakpoint subsystem or the sendBreak (via ShouldBreak meta) is true (and it will have handled firing events for the bp) """ pc = self.getProgramCounter() if self._break_after_bp: bi = self.archGetBreakInstr() pc -= len(bi) bp = self.breakpoints.get(pc, None) if bp: addr = bp.getAddress() # Step back one instruction to account break self.setProgramCounter(addr) self._fireBreakpoint(bp) return True if self.getMeta("ShouldBreak"): self.setMeta("ShouldBreak", False) self.fireNotifiers(vtrace.NOTIFY_BREAK) return True return False
[docs] def notify(self, event, trace): """ We are frequently a notifier for ourselves, so we can do things like handle events on attach and on break in a unified fashion. """ self.threadcache = None self.mapcache = None self.fds = None self.running = False if event in self.auto_continue: self.runAgain() # For thread exits, make sure the tid # isn't in if event == vtrace.NOTIFY_EXIT_THREAD: tid = self.getMeta("ThreadId") self.sus_threads.pop(tid, None) # Check if this is a thread we were waiting on. if tid == self._join_thread: self._join_thread = None # Turn off the RunForever in joinThread() self.setMode('RunForever', False) # Either way, we don't want to run again... self.runAgain(False) # Do the stuff we do for detach/exit or # cleanup breaks etc... if event == vtrace.NOTIFY_ATTACH: pass elif event == vtrace.NOTIFY_DETACH: for tid in self.sus_threads.keys(): self.resumeThread(tid) self._cleanupBreakpoints() elif event == vtrace.NOTIFY_EXIT: self.setMode("RunForever", False) self.exited = True self.attached = False elif event == vtrace.NOTIFY_CONTINUE: self.runagain = False else: self._cleanupBreakpoints()
[docs] def delLibraryBase(self, baseaddr): libname = self.getMeta("LibraryPaths").get(baseaddr, "unknown") normname = self.normFileName(libname) sym = self.getSymByName(normname) self.setMeta("LatestLibrary", libname) self.setMeta("LatestLibraryNorm", normname) self.fireNotifiers(vtrace.NOTIFY_UNLOAD_LIBRARY) self.getMeta("LibraryBases").pop(normname, None) self.getMeta("LibraryPaths").pop(baseaddr, None) if sym != None: self.delSymbol(sym)
[docs] def addLibraryBase(self, libname, address, always=False): """ This should be used *at load time* to setup the library event metadata. This *must* be called from a context where it's safe to fire notifiers, because it will fire a notifier to alert about a LOAD_LIBRARY. (This means *not* from inside another notifer) """ self.setMeta("LatestLibrary", None) self.setMeta("LatestLibraryNorm", None) normname = self.normFileName(libname) if self.getSymByName(normname) != None: normname = "%s_%.8x" % (normname,address) # Only actually do library work with a file or force if os.path.exists(libname) or always: self.getMeta("LibraryPaths")[address] = libname self.getMeta("LibraryBases")[normname] = address self.setMeta("LatestLibrary", libname) self.setMeta("LatestLibraryNorm", normname) width = self.arch.getPointerSize() sym = e_resolv.FileSymbol(normname, address, 0, width=width) sym.casesens = self.casesens self.addSymbol(sym) self.libpaths[normname] = libname self.fireNotifiers(vtrace.NOTIFY_LOAD_LIBRARY)
[docs] def normFileName(self, libname): basename = os.path.basename(libname) return basename.split(".")[0].split("-")[0].lower()
def _findLibraryMaps(self, magic, always=False): # A utility for platforms which lack library load # notification through the operating system done = {} mlen = len(magic) for addr,size,perms,fname in self.getMemoryMaps(): if not fname: continue if done.get(fname): continue try: if self.readMemory(addr, mlen) == magic: done[fname] = True self.addLibraryBase(fname, addr, always=always) except: pass # *never* do this... except this once... def _loadBinaryNorm(self, normname): if not self.libloaded.get(normname, False): fname = self.libpaths.get(normname) if fname != None: self._loadBinary(fname) return True return False def _loadBinary(self, filename): """ Check if a filename has yet to be parsed. If it has NOT been parsed, parse it and return True, otherwise, return False """ normname = self.normFileName(filename) if not self.libloaded.get(normname, False): address = self.getMeta("LibraryBases").get(normname) if address != None: self.platformParseBinary(filename, address, normname) self.libloaded[normname] = True return True return False def _simpleCreateThreads(self): ''' Fire a thread event for each of the current threads. (for use by tracers which don't get help from the OS) ''' initid = self.getMeta('ThreadId') for tid in self.platformGetThreads().keys(): self.setMeta('ThreadId', tid) self.fireNotifiers(vtrace.NOTIFY_CREATE_THREAD) self.setMeta('ThreadId', initid) ####################################################################### # # NOTE: all platform/arch defaults are populated here. #
[docs] def platformGetThreads(self): """ Return a dictionary of <threadid>:<tinfo> pairs where tinfo is either the stack top, or the teb for win32 """ raise Exception("Platform must implement platformGetThreads()")
[docs] def platformSelectThread(self, thrid): """ Platform implementers are encouraged to use the metadata field "ThreadId" as the identifier (int) for which thread has "focus". Additionally, the field "StoppedThreadId" should be used in instances (like win32) where you must specify the ORIGINALLY STOPPED thread-id in the continue. """ self.setMeta("ThreadId",thrid)
[docs] def platformSuspendThread(self, thrid): raise Exception("Platform must implement platformSuspendThread()")
[docs] def platformResumeThread(self, thrid): raise Exception("Platform must implement platformResumeThread()")
[docs] def platformInjectThread(self, pc, arg=0): raise Exception("Platform must implement platformInjectThread()")
[docs] def platformKill(self): raise Exception("Platform must implement platformKill()")
[docs] def platformExec(self, cmdline): """ Platform exec will execute the process specified in cmdline and return the PID """ raise Exception("Platmform must implement platformExec")
[docs] def platformInjectSo(self, filename): raise Exception("Platform must implement injectso()")
[docs] def platformGetFds(self): """ Return what getFds() wants for this particular platform """ raise Exception("Platform must implement platformGetFds()")
[docs] def platformGetSignal(self): ''' Return the currently posted exception/signal.... ''' # Default to the thing they all should do... return self.getMeta('PendingSignal', None)
[docs] def platformSetSignal(self, sig=None): ''' Set the current signal to deliver to the process on cont. (Use None for no signal delivery. ''' self.setMeta('PendingSignal', sig)
[docs] def platformGetMaps(self): """ Return a list of the memory maps where each element has the following structure: (address, length, perms, file="") NOTE: By Default this list is available as Trace.maps because the default implementation attempts to populate them on every break/stop/etc... """ raise Exception("Platform must implement GetMaps")
[docs] def platformPs(self): """ Actually return a list of tuples in the format (pid, name) for this platform """ raise Exception("Platform must implement Ps")
[docs] def archGetStackTrace(self): raise Exception("Architecure must implement argGetStackTrace()!")
[docs] def archAddWatchpoint(self, address, size=4, perms="rw"): """ Add a watchpoint for the given address. Raise if the platform doesn't support, or too many are active... """ raise Exception("Architecture doesn't implement watchpoints!")
[docs] def archRemWatchpoint(self, address): raise Exception("Architecture doesn't implement watchpoints!")
[docs] def archCheckWatchpoints(self): """ If the current register state indicates that a watchpoint was hit, return the address of the watchpoint and clear the event. Otherwise return None """ pass
[docs] def archGetRegCtx(self): """ Return a new empty envi.registers.RegisterContext object for this trace. """ raise Exception("Platform must implement archGetRegCtx()")
[docs] def getStackTrace(self): """ Return a list of the stack frames for this process (currently Intel/ebp based only). Each element of the "frames list" consists of another list which is (eip,ebp) """ raise Exception("Platform must implement getStackTrace()")
[docs] def getExe(self): """ Get the full path to the main executable for this *attached* Trace """ return self.getMeta("ExeName","Unknown")
[docs] def platformAttach(self, pid): """ Actually carry out attaching to a target process. Like platformStepi this is expected to be ATOMIC and not return until a complete attach. """ raise Exception("Platform must implement platformAttach()")
[docs] def platformContinue(self): raise Exception("Platform must implement platformContinue()")
[docs] def platformDetach(self): """ Actually perform the detach for this type """ raise Exception("Platform must implement platformDetach()")
[docs] def platformStepi(self): """ PlatformStepi should be ATOMIC, meaning it gets called, and by the time it returns, you're one step further. This is completely regardless of blocking/nonblocking/whatever. """ raise Exception("Platform must implement platformStepi!")
[docs] def platformCall(self, address, args, convention=None): """ Platform call takes an address, and an array of args (string types will be mapped and located for you) platformCall is expected to return a dicionary of the current register values at the point where the call has returned... """ raise Exception("Platform must implement platformCall")
[docs] def platformGetRegCtx(self, threadid): raise Exception("Platform must implement platformGetRegCtx!")
[docs] def platformSetRegCtx(self, threadid, ctx): raise Exception("Platform must implement platformSetRegCtx!")
[docs] def platformProtectMemory(self, va, size, perms): raise Exception("Plaform does not implement protect memory")
[docs] def platformAllocateMemory(self, size, perms=e_mem.MM_RWX, suggestaddr=0): raise Exception("Plaform does not implement allocate memory")
[docs] def platformReadMemory(self, address, size): raise Exception("Platform must implement platformReadMemory!")
[docs] def platformWriteMemory(self, address, bytes): raise Exception("Platform must implement platformWriteMemory!")
[docs] def platformGetMemFault(self): """ Return the addr of the current memory fault or None """ #NOTE: This is used by the PageWatchpoint subsystem # (and is still considered experimental) return None,None
[docs] def platformWait(self): """ Wait for something interesting to occur and return a *platform specific* representation of what happened. This will then be passed to the platformProcessEvent() method which will be responsible for doing things like firing notifiers. Because the platformWait() method needs to be commonly @threadwrap and you can't fire notifiers from within a threadwrapped function... """ raise Exception("Platform must implement platformWait!")
[docs] def platformProcessEvent(self, event): """ This method processes the event data provided by platformWait() This method is responsible for firing ALL notifiers *except*: vtrace.NOTIFY_CONTINUE - This is handled by the run api (and isn't the result of an event) """ raise Exception("Platform must implement platformProcessEvent")
[docs] def platformOpenFile(self, filename): # Open a file for reading return file(filename, 'rb')
[docs] def platformParseBinary(self, filename, baseaddr, normname): """ Platforms must parse the given binary file and load any symbols into the internal SymbolResolver using self.addSymbol() """ raise Exception("Platform must implement platformParseBinary")
[docs] def platformRelease(self): ''' Called back on release. ''' pass
import threading
[docs]def threadwrap(func): def trfunc(self, *args, **kwargs): if threading.currentThread().__class__ == TracerThread: return func(self, *args, **kwargs) # Proxy the call through a single thread q = Queue() # FIXME change calling convention! args = (self, ) + args self.thread.queue.put((func, args, kwargs, q)) ret = q.get() if issubclass(ret.__class__, Exception): raise ret return ret return trfunc
[docs]class TracerThread(Thread): """ Ok... so here's the catch... most debug APIs do *not* allow one thread to do the attach and another to do continue and another to do wait... they just dont. So there. I have to make a thread per-tracer (on most platforms) and proxy requests (for *some* trace API methods) to it for actual execution. SUCK! However, this lets async things like GUIs and threaded things like cobra not have to be aware of which one is allowed and not allowed to make particular calls and on what platforms... YAY! """ def __init__(self): Thread.__init__(self) self.queue = Queue() self.setDaemon(True) self.start()
[docs] def run(self): """ Run in a circle getting requests from our queue and executing them based on the thread. """ while True: try: qobj = self.queue.get() if qobj == None: break meth, args, kwargs, queue = qobj try: queue.put(meth(*args, **kwargs)) except Exception,e: queue.put(e) if vtrace.verbose: traceback.print_exc() continue except: if vtrace.verbose: traceback.print_exc()