import enum
import subprocess
import logging
from idascript import IDA_BINARY
from pathlib import Path
from multiprocessing import Pool, Queue, Manager
import queue
import os
from typing import List, Optional, Iterable, Union, Generator
TIMEOUT_RETURNCODE: int = -1
[docs]
class IDAException(Exception):
"""
Base class for exceptions in the module.
"""
pass
[docs]
class IDANotStared(IDAException):
"""
This exception is raised when attempting
to call a function of the `IDA` class before
having called `start`.
"""
pass
[docs]
class IDAModeNotSet(IDAException):
"""
This exception is raised when the IDA Mode has not been set before calling `start`.
"""
pass
[docs]
class MultiIDAAlreadyRunning(IDAException):
"""
Exception raised if the `map` function of MultiIDA
is called while another map operation is still pending.
Design choices disallow launching two MultiIDA.map
function in the same time.
"""
pass
class IDAMode(enum.Enum):
"""
Different modes possible for the IDA class
"""
# Default value
NOTSET = enum.auto()
# Used when IDA will be launched for an IDAPython script
IDAPYTHON = enum.auto()
# Used when IDA will be launched directly
DIRECT = enum.auto()
[docs]
class IDA:
"""
Class representing an IDA execution on a given file
with a given script. This class is a wrapper to
subprocess IDA.
"""
def __init__(self,
binary_file: Union[Path, str],
script_file: Optional[Union[str, Path]] = None,
script_params: Optional[List[str]] = None,
timeout: Optional[float] = None,
exit_virtualenv: bool = False):
"""
:param binary_file: path of the binary file to analyse
:param script_file: path to the Python script to execute on the binary (if required)
:param script_params: additional parameters to send either to the script or IDA directly
:param exit_virtualenv: exit current virtual env before calling IDA
"""
if not Path(binary_file).exists():
raise FileNotFoundError("Binary file: %s" % binary_file)
self.bin_file: Path = Path(binary_file).resolve() #: File to the binary
self._process = None
self.script_file: Optional[Path] = None #: script file to execute
self.params: List[str] = [] #: list of paramaters given to IDA
self.timeout: Optional[float] = timeout #: Timeout for IDA execution
self.exit_virtualenv: bool = exit_virtualenv
if script_file is not None: # Mode IDAPython
self._set_idapython(script_file, script_params)
else: # Direct mode
self._set_direct(script_params)
def _set_idapython(self, script_file: Union[Path, str], script_params: List[str] = None) -> None:
"""
Set IDAPython script parameter.
:param script_file: path to the script to execute on the binary file
:param script_params: additional parameters sent to the script (available via idc.ARGV in idapython)
"""
if not Path(script_file).exists():
raise FileNotFoundError("Script file: %s" % script_file)
if script_params is None:
script_params = []
if script_params:
if not isinstance(script_params, list):
raise TypeError("script_params parameter should be a list")
self.script_file = Path(script_file).resolve()
self.params = [x.replace('"', '\\"') for x in script_params] if script_params else []
self.mode = IDAMode.IDAPYTHON
def _set_direct(self, script_options: List[str]) -> None:
"""
Set parameters script in direct mode
:param script_options: List of script options
:return: None
"""
for option in script_options:
if ':' not in option:
raise TypeError('Options must have a ":"')
self.params.append(f'-O{option}')
self.mode = IDAMode.DIRECT
[docs]
def start(self) -> None:
"""
Start the IDA process on the binary.
"""
cmd_line = [IDA_BINARY.as_posix(), '-A']
if self.mode == IDAMode.IDAPYTHON:
params = " "+" ".join(self.params) if self.params else ""
cmd_line.append('-S%s%s' % (self.script_file.as_posix(), params))
elif self.mode == IDAMode.DIRECT:
cmd_line.extend(self.params)
else:
raise
cmd_line.append(self.bin_file.as_posix())
logging.debug(f"run: {' '.join(cmd_line)}")
env = os.environ
env["TVHEADLESS"] = "1"
env["TERM"] = "xterm"
if self.exit_virtualenv:
venv = env.pop("VIRTUAL_ENV", None)
if venv:
paths = env["PATH"].split(":")
env["PATH"] = ":".join(x for x in paths if venv not in x)
self._process = subprocess.Popen(
cmd_line,
stdout=subprocess.DEVNULL,
stderr=subprocess.DEVNULL,
# See `https://www.hex-rays.com/blog/igor-tip-of-the-week-08-batch-mode-under-the-hood/`_
env=env
)
@property
def returncode(self) -> Optional[int]:
"""
Get the returncode of the process. Raise IDANotStart
if called before launching the process.
"""
if self._process:
return self._process.returncode
else:
raise IDANotStared()
@property
def terminated(self) -> bool:
"""
Boolean function returning True if the process is terminated
"""
if self._process:
if self._process.poll() is not None:
return True
else:
return False
else:
raise IDANotStared()
@property
def pid(self) -> int:
"""
Returns the PID of the IDA process
:return: int (PID of the process)
"""
if self._process:
return self._process.pid
else:
raise IDANotStared()
[docs]
def wait(self) -> int:
"""
Wait for the process to finish. This function hangs until
the process terminate. A timeout can be given which raises
TimeoutExpired if the timeout is exceeded (subprocess mechanism).
"""
if self._process:
try:
return self._process.wait(self.timeout)
except subprocess.TimeoutExpired:
self._process.terminate()
return TIMEOUT_RETURNCODE
else:
raise IDANotStared()
[docs]
def terminate(self) -> None:
"""
Call terminate on the IDA process (kill -15)
"""
if self._process:
self._process.terminate()
else:
raise IDANotStared()
[docs]
def kill(self) -> None:
"""
Call kill on the IDA subprocess (kill -9)
"""
if self._process:
self._process.kill()
else:
raise IDANotStared()
[docs]
class MultiIDA:
"""
Class to trigger multiple IDA processes concurrently
on a bunch of files.
"""
@staticmethod
def _worker(ingress, egress, script_file, params, timeout, exit_virtualenv) -> None:
while True:
try:
file = ingress.get(timeout=0.5)
ida = IDA(file, script_file, params, timeout, exit_virtualenv)
ida.start()
res = ida.wait()
egress.put((file, res))
except queue.Empty:
pass
except KeyboardInterrupt:
break
[docs]
@staticmethod
def map(generator: Iterable[Path],
script: Union[str, Path] = None,
params: List[str] = None,
workers: int = None,
timeout: Optional[float] = None,
exit_virtualenv: bool = False) -> Generator[tuple[int, Path], None, None]:
"""
Iterator the generator sent and apply the script file on each
file concurrently on a bunch of IDA workers. The function consume
the generator as fast as it can occupy all the workers and yield a
tuple (return code, path file) everytime an IDA process as terminated.
:param generator: Iterable of file paths strings (or Path)
:param script: path to the script to execute
:param params: list of parameters to send to the script
:param workers: number of workers to trigger in parallel
:param timeout: timeout for IDA runs (-1 means infinity)
:param exit_virtualenv: exit current virtualenv before calling IDA
:return: generator of files processed (return code, file path)
"""
manager = Manager()
ingress = manager.Queue()
egress = manager.Queue()
pool = Pool(workers)
# Launch all workers
for i in range(workers):
pool.apply_async(MultiIDA._worker, (ingress, egress, script, params, timeout, exit_virtualenv))
# Pre-fill ingress queue
total = 0
for file in generator:
ingress.put(file)
total += 1
i = 0
while True:
path, res = egress.get()
i += 1
yield path, res
# once all items have been processed
if i == total:
break
pool.terminate()