Following PR #169744 the DAP launch sequencing of Dexter was changed to complete a launch request/response before performing configuration steps. This matches LLDB's current behaviour, but is not compatible with the DAP specification and causes issues interfacing with other debuggers. This patch tries to bridge the gap by using a sequencing that is mostly DAP-compliant while still interfacing correctly with lldb-dap: we send a launch request first, then perform all configuration steps and send configurationDone, and then await the launch response. For lldb-dap, we do not wait for the launch response and may send configuration requests before it is received, but lldb-dap appears to handle this without issue. For other debug adapters, the launch request will be ignored until the configurationDone request is received and responded to, at which point the launch request will be acted upon and responded to. As an additional note, the initialized event should be sent after the initialize response and before the launch request according to the spec, but as LLDB currently sends it after the launch response Dexter has avoided checking for it. Since the initialized event is now being sent after the launch response by LLDB, we can start checking for it earlier in the sequence as well (though technically the client should receive the initialized event before it sends the launch request).
973 lines
42 KiB
Python
973 lines
42 KiB
Python
# DExTer : Debugging Experience Tester
|
|
# ~~~~~~ ~ ~~ ~ ~~
|
|
#
|
|
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
# See https://llvm.org/LICENSE.txt for license information.
|
|
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
"""Interface for communicating with a debugger via the DAP.
|
|
"""
|
|
|
|
import abc
|
|
from collections import defaultdict
|
|
import copy
|
|
import json
|
|
import os
|
|
import shlex
|
|
import subprocess
|
|
import sys
|
|
import threading
|
|
import time
|
|
from enum import Enum
|
|
|
|
from dex.debugger.DebuggerBase import DebuggerBase, watch_is_active
|
|
from dex.dextIR import FrameIR, LocIR, StepIR, StopReason, ValueIR
|
|
from dex.dextIR import StackFrame, SourceLocation, ProgramState
|
|
from dex.utils.Exceptions import DebuggerException, LoadDebuggerException
|
|
from dex.utils.ReturnCode import ReturnCode
|
|
from dex.utils.Logging import Logger
|
|
from dex.utils.Timeout import Timeout
|
|
|
|
|
|
# Helper enum used for colorizing DAP Message Log output.
|
|
class Color(Enum):
    """ANSI foreground colour codes used to colourise DAP message log output."""

    CYAN = 36
    GREEN = 32
    YELLOW = 33
    RED = 31
    MAGENTA = 35

    def apply(self, text: str) -> str:
        """Return `text` wrapped in this colour's escape sequence and a trailing reset."""
        colour_on = f"\033[{self.value}m"
        colour_off = "\033[0m"
        return f"{colour_on}{text}{colour_off}"
|
|
|
|
|
|
class DAPMessageLogger:
    """Writes every DAP message that is sent or received to an optional log sink.

    The sink is selected by `context.options.dap_message_log`: None disables logging, "-" selects
    stdout, "-e" selects stderr, and any other value is used as a file path opened for writing.
    """

    def __init__(self, context):
        self.dexter_logger = context.logger
        self.log_file: str = context.options.dap_message_log
        self.colorized: bool = context.options.colorize_dap_log
        # json.dumps() pretty-prints when given an indent and emits a single line when given None.
        self.indent = 2 if context.options.format_dap_log == "pretty" else None
        self.prefix_send: str = "->"
        self.prefix_recv: str = "<-"
        self.out_handle = None
        self.open = False
        # Serialises writes to out_handle, since write_message may be called from several threads.
        self.lock = threading.Lock()

    def _custom_enter(self):
        """Mark the logger as open and bind `out_handle` to the configured sink (if any)."""
        self.open = True
        if self.log_file is None:
            return
        if self.log_file == "-":
            self.out_handle = sys.stdout
            return
        if self.log_file == "-e":
            self.out_handle = sys.stderr
            return
        self.out_handle = open(self.log_file, "w+", encoding="utf-8")

    def _custom_exit(self):
        """Close the sink if it is a file that we opened, and mark the logger as closed."""
        if (
            self.out_handle is not None
            and self.log_file != "-"
            and self.log_file != "-e"
        ):
            self.out_handle.close()
        self.open = False

    def _colorize_dap_message(self, message: dict) -> dict:
        """Return `message` unchanged if colouring is off, else a deep copy with coloured fields."""
        if not self.colorized:
            return message
        colorized_message = copy.deepcopy(message)
        if colorized_message["type"] == "event":
            colorized_message["type"] = Color.YELLOW.apply("event")
            colorized_message["event"] = Color.YELLOW.apply(colorized_message["event"])
        elif colorized_message["type"] == "response":
            colorized_message["type"] = Color.GREEN.apply("response")
            colorized_message["command"] = Color.YELLOW.apply(
                colorized_message["command"]
            )
        elif colorized_message["type"] == "request":
            colorized_message["type"] = Color.CYAN.apply("request")
            colorized_message["command"] = Color.YELLOW.apply(
                colorized_message["command"]
            )
        return colorized_message

    def write_message(self, message: dict, incoming: bool):
        """Log one DAP message, prefixed with "<-" if `incoming` and "->" otherwise.

        Nothing is written (or serialised) while the logger is open without a sink. If the logger
        has already been closed, a warning containing the message goes to the Dexter logger.
        """
        if self.open and self.out_handle is None:
            # Logging is disabled: skip the deep copy and JSON dump that would be thrown away.
            return
        prefix = self.prefix_recv if incoming else self.prefix_send
        # ANSI escape codes get butchered by json.dumps(), so we fix them up here.
        message_str = json.dumps(
            self._colorize_dap_message(message), indent=self.indent
        ).replace("\\u001b", "\033")
        if self.open:
            with self.lock:
                self.out_handle.write(f"{prefix} {message_str}\n")
        else:
            self.dexter_logger.warning(
                f'Attempted to write message after program closed: "{prefix} {message_str}"'
            )
|
|
|
|
|
|
# Debuggers communicate optional feature support.
|
|
class DAPDebuggerCapabilities:
    """Optional DAP features reported by the debugger; every flag starts out as unsupported."""

    def __init__(self):
        self.supportsConfigurationDoneRequest: bool = False
        self.supportsFunctionBreakpoints: bool = False
        self.supportsConditionalBreakpoints: bool = False
        self.supportsHitConditionalBreakpoints: bool = False
        self.supportsEvaluateForHovers: bool = False
        self.supportsSetVariable: bool = False
        self.supportsStepInTargetsRequest: bool = False
        self.supportsModulesRequest: bool = False
        self.supportsValueFormattingOptions: bool = False
        self.supportsLogPoints: bool = False
        self.supportsSetExpression: bool = False
        self.supportsDataBreakpoints: bool = False
        self.supportsReadMemoryRequest: bool = False
        self.supportsWriteMemoryRequest: bool = False
        self.supportsDisassembleRequest: bool = False
        self.supportsCancelRequest: bool = False
        self.supportsSteppingGranularity: bool = False
        self.supportsInstructionBreakpoints: bool = False

    def update(self, logger: Logger, feature_dict: dict):
        """Copy each entry of `feature_dict` onto the matching attribute.

        Keys that do not name an existing attribute are reported through `logger.warning` and
        otherwise ignored.
        """
        for flag, value in feature_dict.items():
            if not hasattr(self, flag):
                logger.warning(f"DAP: Unknown support flag: {flag}")
                continue
            setattr(self, flag, value)
|
|
|
|
|
|
# As DAP does not give us a trivially query-able process, we are responsible for maintaining our own state information,
|
|
# including what breakpoints are currently set, and whether the debugger is running or stopped.
|
|
# This class holds all state that is set based on events sent by the debug adapter; most responses are forwarded through
|
|
# to the main DAP class, though in a few cases where it is convenient for bookkeeping the DAPDebuggerState may read some
|
|
# information from the responses before forwarding them onwards.
|
|
class DAPDebuggerState:
    """Local bookkeeping for the state of the debug adapter and the debuggee.

    Holds everything that is derived from adapter events, plus the table of responses received
    so far (indexed by the `seq` of the request each response answers).
    """

    def __init__(self):
        ## Session-wide state.
        # Set once the initialize update has been received.
        self.initialized: bool = False
        # Set once the debugger has successfully launched.
        self.launched: bool = False
        # The thread being debugged.
        # TODO: Handling is primitive and assumes a single thread; debugging multi-threaded
        # programs will need more complex state to be tracked here.
        self.thread = None
        # True while the debuggee is executing.
        self.is_running: bool = False
        # True once the debuggee has finished executing.
        self.is_finished: bool = False

        ## State describing one particular stop; invalidated whenever execution resumes.
        # None while the debuggee is running, otherwise a string giving the reason it stopped.
        self.stopped_reason = None
        # When stopped for the reason 'breakpoint': the DAP breakpoint IDs responsible for the stop.
        self.stopped_bps = []
        # For a stopped process: frame index (top of stack=0) -> frameId returned by the adapter.
        self.frame_map = []

        # responses[idx] is the response to the request sent with seq=idx: either the response
        # payload, or None if it has not arrived yet. Requests are numbered from 1, so a leading
        # None keeps the first real entry at the right index.
        self.responses = [None]
        # DAP breakpoint ID -> resolved instruction address.
        self.bp_addr_map = {}

        # DAP features supported by the debugger.
        self.capabilities = DAPDebuggerCapabilities()

    def set_response(self, req_id: int, response: dict):
        """Store `response` at index `req_id`, padding the table with None if it is too short."""
        shortfall = req_id + 1 - len(self.responses)
        if shortfall > 0:
            self.responses.extend([None] * shortfall)
        self.responses[req_id] = response

    # The receiver thread is the only writer of this object and does not know when a request has
    # been sent, so the table may not yet contain a slot for a request the main thread is waiting
    # on. This getter treats such missing slots as "no response yet".
    def get_response(self, req_id: int):
        """Return the response stored for `req_id`, or None if there is none yet."""
        return self.responses[req_id] if req_id < len(self.responses) else None
|
|
|
|
|
|
# DAP Communication model:
|
|
# - Communication is message-based, not stateful - we cannot simply query information from the debugger as we can with
|
|
# other debugger implementations, we need to maintain local state.
|
|
# - All messages are UTF-8-encoded JSON, which we convert to/from Python dicts in send_message/_read_dap_output; some amount of
|
|
# bookkeeping is performed automatically in the DAP class.
|
|
# - Commands and queries are sent via 'request' messages, for which a corresponding 'response' will always be sent back
|
|
# by the adapter indicating success/failure, containing data related to the request.
|
|
# - The adapter will also send 'event' messages, indicating state changes in the debugger - for example, when the
|
|
# debugger has stopped at a breakpoint.
|
|
# In order to handle this, we run a separate thread that will continuously insert any messages received
|
|
# from the adapter into a queue, which the main thread will read; generally, our response to any read message
|
|
# is to update our state, which Dexter's DebuggerController will then read.
|
|
class DAP(DebuggerBase, metaclass=abc.ABCMeta):
|
|
def __init__(self, context, *args):
    """Set up adapter-process handles and breakpoint bookkeeping, then run the base initialiser."""
    # Adapter process, its reader threads, and the state those threads maintain.
    self._debugger_state = DAPDebuggerState()
    self._proc = None
    self._receiver_thread = None
    self._err_thread = None
    self.message_logger = None
    # seq of the most recently sent request; incremented before each send.
    self.seq = 0
    self.target_proc_id = -1

    # Next Dexter breakpoint ID to hand out.
    self.max_bp_id = 0
    # Active breakpoints per file; intentionally excludes breakpoints that we have deleted.
    # { file -> [dex_breakpoint_id] }
    self.file_to_bp = defaultdict(list)
    # { dex_breakpoint_id -> (file, line, condition) }
    self.bp_info = {}
    # { dex_breakpoint_id -> function_name }
    self.function_bp_info = {}
    # { dex_breakpoint_id -> instruction_reference }
    self.instruction_bp_info = {}
    # IDs returned by the debug adapter are not used directly. Dexter breakpoint IDs are used
    # instead, with a two-way dex_bp_id<->dap_bp_id mapping, which also lets us defer setting
    # breakpoints in the adapter until necessary.
    # NB: The adapter may merge several Dexter-side breakpoints into one debugger-side
    # breakpoint, so the DAP->Dex direction is one-to-many.
    self.dex_id_to_dap_id = {}
    self.dap_id_to_dex_ids = {}
    # Dirty flags: set when the matching breakpoint kind has changes not yet sent to the adapter.
    self.pending_breakpoints: bool = False
    self.pending_function_breakpoints: bool = False
    self.pending_instruction_breakpoints: bool = False
    # List of breakpoints, indexed by BP ID
    # Each entry has the source file (for use in referencing desired_bps), and the DA-assigned
    # ID for that breakpoint if it has one (if it has been removed or not yet created then it will be None).
    # self.bp_source_list: list[(str, int)]
    super().__init__(context, *args)
|
|
|
|
@property
|
|
@abc.abstractmethod
|
|
def _debug_adapter_name(self) -> str:
|
|
pass
|
|
|
|
@property
|
|
@abc.abstractmethod
|
|
def _debug_adapter_executable(self) -> str:
|
|
pass
|
|
|
|
@property
|
|
def _debug_adapter_launch_args(self) -> list:
|
|
return []
|
|
|
|
@staticmethod
|
|
def make_request(command: str, arguments=None) -> dict:
|
|
request = {"type": "request", "command": command}
|
|
if arguments is not None:
|
|
request["arguments"] = arguments
|
|
return request
|
|
|
|
@staticmethod
def make_initialize_request(adapterID: str) -> dict:
    """Build the DAP 'initialize' request that identifies Dexter as the client of `adapterID`."""
    client_settings = {
        "clientID": "dexter",
        "adapterID": adapterID,
        "pathFormat": "path",
        "linesStartAt1": True,
        "columnsStartAt1": True,
        "supportsVariableType": True,
        "supportsVariablePaging": True,
        "supportsRunInTerminalRequest": False,
    }
    return DAP.make_request("initialize", client_settings)
|
|
|
|
class BreakpointRequest:
    """A source breakpoint to request from the adapter: a line plus an optional condition."""

    def __init__(self, line: int, condition=None):
        self.line = line
        self.condition = condition

    def toDict(self) -> dict:
        """Return the dict form of this breakpoint; "condition" is omitted when it is None."""
        if self.condition is None:
            return {"line": self.line}
        return {"line": self.line, "condition": self.condition}
|
|
|
|
@staticmethod
def make_set_breakpoint_request(source: str, bps) -> dict:
    """Build a 'setBreakpoints' request for file `source` from BreakpointRequest-like objects.

    Each element of `bps` only needs a `toDict()` method.
    """
    serialized_bps = [bp.toDict() for bp in bps]
    arguments = {"source": {"path": source}, "breakpoints": serialized_bps}
    return DAP.make_request("setBreakpoints", arguments)
|
|
|
|
@staticmethod
def make_set_function_breakpoint_request(function_names: list) -> dict:
    """Build a 'setFunctionBreakpoints' request with one name-only breakpoint per function."""
    # Function breakpoints may also carry conditions and hit counts, which are not used here
    # (though now that DAP gives us a shared interface, perhaps native hit counts should replace
    # the emulation in ConditionalController).
    by_name = [{"name": function_name} for function_name in function_names]
    return DAP.make_request("setFunctionBreakpoints", {"breakpoints": by_name})
|
|
|
|
@staticmethod
def make_set_instruction_breakpoint_request(addrs: list) -> dict:
    """Build a 'setInstructionBreakpoints' request with one breakpoint per instruction reference."""
    # Instruction breakpoints have additional fields that are ignored for the moment.
    by_address = [{"instructionReference": addr} for addr in addrs]
    return DAP.make_request("setInstructionBreakpoints", {"breakpoints": by_address})
|
|
|
|
############################################################################
|
|
## DAP communication & state-handling functions
|
|
|
|
# Sends a request to the adapter, returning the seq value of the request.
|
|
def send_message(self, payload: dict) -> int:
    """Stamp `payload` with the next seq number, log it, and write it to the adapter's stdin.

    The message is framed with a Content-Length header followed by a blank line and the JSON
    body. Returns the seq number assigned to the request.
    """
    seq = self.seq + 1
    self.seq = seq
    payload["seq"] = seq
    self.message_logger.write_message(payload, False)
    encoded_body = json.dumps(payload).encode("utf-8")
    header = f"Content-Length: {len(encoded_body)}\r\n\r\n".encode("utf-8")
    adapter_stdin = self._proc.stdin
    adapter_stdin.write(header + encoded_body)
    adapter_stdin.flush()
    return seq
|
|
|
|
@staticmethod
def _handle_message(
    message: dict, debugger_state: DAPDebuggerState, logger: Logger
):
    """Update `debugger_state` from one message received from the debug adapter.

    Events update the tracked run/stop state. Responses may update some cached state and are
    then stored via `debugger_state.set_response`, keyed by their `request_seq`. Messages of any
    other type are ignored.
    """
    # We only support events and responses, we do not implement any reverse-requests.
    # TODO: If we find cases where 'seq' becomes important, we need to read it here and process
    # pending messages in order.
    if message["type"] == "event":
        event_type = message["event"]
        event_details = message.get("body")
        if event_type == "initialized":
            debugger_state.initialized = True
        elif event_type == "process":
            debugger_state.launched = True
            debugger_state.is_running = True
        # The debugger has stopped for some reason.
        elif event_type == "stopped":
            stop_reason = event_details["reason"]
            debugger_state.is_running = False
            debugger_state.stopped_reason = stop_reason
            debugger_state.stopped_bps = event_details.get("hitBreakpointIds", [])
            # 'threadId' is optional on stopped events; keep the current thread if it is
            # absent rather than raising and killing the receiver thread.
            thread_id = event_details.get("threadId")
            if thread_id is not None:
                debugger_state.thread = thread_id
        elif event_type == "breakpoint":
            # We handle most BP information in the main DAP thread by reading responses to
            # breakpoint requests; some information is only passed via event, however, which
            # we store here.
            breakpoint_details = event_details["breakpoint"]
            if "instructionReference" in breakpoint_details:
                debugger_state.bp_addr_map[
                    breakpoint_details["id"]
                ] = breakpoint_details["instructionReference"]
        elif event_type == "exited" or event_type == "terminated":
            debugger_state.stopped_reason = event_type
            debugger_state.is_running = False
            debugger_state.is_finished = True
        # We may receive this event before or after the response to the corresponding
        # "continue" request.
        elif event_type == "continued":
            debugger_state.is_running = True
            # Reset all state that is invalidated upon program continue.
            debugger_state.stopped_reason = None
            debugger_state.stopped_bps = []
            debugger_state.frame_map = []
        elif event_type == "thread":
            if (
                event_details["reason"] == "started"
                and debugger_state.thread is None
            ):
                debugger_state.thread = event_details["threadId"]
        elif event_type == "capabilities":
            # Unchanged capabilities may not be included.
            # The DAP specification nests the flags under body["capabilities"]; fall back to
            # the body itself for an adapter that sends them un-nested.
            if event_details:
                changed_flags = event_details.get("capabilities", event_details)
                debugger_state.capabilities.update(logger, changed_flags)
        # There are many events we do not care about, just skip processing them.
        else:
            pass
    elif message["type"] == "response":
        command = message["command"]
        succeeded = message.get("success") is True
        # TODO: We also receive a "continued" event, but it seems reasonable to set state based
        # on either the response or the event, since the DAP does not specify an order in which
        # they are sent. May need revisiting if there turns out to be some odd ordering issues,
        # e.g. if we can receive messages in the order
        # ["response: continued", "event: stopped", "event: continued"].
        if succeeded and command in ("continue", "stepIn", "next", "stepOut"):
            debugger_state.is_running = True
            # Reset all state that is invalidated upon program continue.
            debugger_state.stopped_reason = None
            debugger_state.stopped_bps = []
            debugger_state.frame_map = []
        # It is useful to cache a mapping of frames; since this is invalidated when we
        # continue, and only this message-handling thread should write to debugger_state, we do
        # so while handling the response for convenience.
        if succeeded and command == "stackTrace":
            debugger_state.frame_map = [
                stackframe["id"] for stackframe in message["body"]["stackFrames"]
            ]
        # The debugger communicates which optional DAP features are supported in its
        # initialize response.
        if succeeded and command == "initialize":
            body = message.get("body")
            if body:
                debugger_state.capabilities.update(logger, body)
        # Now we've done whatever we need to do with the response, store it so that the thread
        # awaiting it can pick it up.
        request_seq = message["request_seq"]
        debugger_state.set_response(request_seq, message)
|
|
|
|
@staticmethod
|
|
def _colorize_dap_message(message: dict) -> dict:
|
|
colorized_message = copy.deepcopy(message)
|
|
if colorized_message["type"] == "event":
|
|
colorized_message["type"] = "<y>event</>"
|
|
colorized_message["event"] = f"<y>{colorized_message['event']}</>"
|
|
elif colorized_message["type"] == "response":
|
|
colorized_message["type"] = "<g>response</>"
|
|
colorized_message["command"] = f"<y>{colorized_message['command']}</>"
|
|
elif colorized_message["type"] == "request":
|
|
colorized_message["type"] = "<b>request</>"
|
|
colorized_message["command"] = f"<y>{colorized_message['command']}</>"
|
|
return colorized_message
|
|
|
|
@staticmethod
def _read_dap_output(
    proc: subprocess.Popen,
    debugger_state: DAPDebuggerState,
    message_logger: DAPMessageLogger,
    logger: Logger,
):
    """Receiver-thread body: read framed DAP messages from `proc.stdout` until it is closed.

    Each message is a header block terminated by a blank line, followed by a JSON body whose
    length is given by the header. Every decoded message is logged through `message_logger` and
    then passed to `DAP._handle_message`.
    """
    buffer: bytes = b""
    while True:
        # Read the header one byte at a time so that we never consume part of the body.
        chunk: bytes = proc.stdout.read(1)
        if not chunk:
            break
        buffer += chunk
        if b"\r\n\r\n" in buffer:
            header, rest = buffer.split(b"\r\n\r\n", 1)
            content_length = int(header.decode().split(":")[1].strip())
            while len(rest) < content_length:
                more = proc.stdout.read(content_length - len(rest))
                if not more:
                    # EOF in the middle of a body: read() would return b"" forever, so stop
                    # here instead of spinning.
                    logger.warning(
                        "DAP server closed its output in the middle of a message"
                    )
                    return
                rest += more
            message = json.loads(rest[:content_length])
            message_logger.write_message(message, True)
            DAP._handle_message(message, debugger_state, logger)
            buffer = rest[content_length:]
|
|
|
|
@staticmethod
def _read_dap_err(proc: subprocess.Popen, logger: Logger):
    """Error-thread body: forward each line the adapter writes to stderr to `logger.error`.

    Returns once stderr reaches end-of-file, i.e. once the adapter has closed it.
    """
    while True:
        err: bytes = proc.stderr.readline()
        if not err:
            # readline() returns b"" only at EOF and would keep doing so forever; leave the
            # loop rather than busy-spinning on a closed pipe.
            break
        logger.error(f"DAP server: {err.decode().strip()}")
|
|
|
|
def _custom_init(self):
    """Spawn the debug adapter, start its reader threads, and complete the 'initialize' request."""
    adapter_cmd = [self._debug_adapter_executable] + self._debug_adapter_launch_args
    dexter_logger = self.context.logger
    dexter_logger.note(f"Opening DAP server: {shlex.join(adapter_cmd)}")

    self.message_logger = DAPMessageLogger(self.context)
    self.message_logger._custom_enter()

    # All three standard streams are unbuffered pipes: stdin/stdout carry the DAP traffic and
    # stderr is forwarded to the Dexter logger.
    self._proc = subprocess.Popen(
        adapter_cmd,
        stdin=subprocess.PIPE,
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
        bufsize=0,
    )

    # Daemon threads, so that blocked reads never prevent the interpreter from exiting.
    receiver_args = (
        self._proc,
        self._debugger_state,
        self.message_logger,
        dexter_logger,
    )
    self._receiver_thread = threading.Thread(
        target=DAP._read_dap_output, args=receiver_args, daemon=True
    )
    self._err_thread = threading.Thread(
        target=DAP._read_dap_err, args=(self._proc, dexter_logger), daemon=True
    )
    self._receiver_thread.start()
    self._err_thread.start()

    initialize_request = self.make_initialize_request(self._debug_adapter_name)
    init_req = self.send_message(initialize_request)
    assert self._proc.poll() is None, "Process has closed unexpectedly early?"
    self._await_response(init_req)
|
|
|
|
def _custom_exit(self):
|
|
if self._proc is not None:
|
|
dc_req = self.send_message(self.make_request("disconnect"))
|
|
dc_req_timeout = 3
|
|
try:
|
|
result = self._await_response(dc_req, dc_req_timeout)
|
|
if not result["success"]:
|
|
self.context.logger.warning(
|
|
"The disconnect request sent to the DAP server failed; forcibly shutting down DAP server."
|
|
)
|
|
else:
|
|
self.context.logger.note(
|
|
"Successfully disconnected from DAP server."
|
|
)
|
|
except:
|
|
# We're going to kill the process regardless, we just want to give the target a chance to shut down
|
|
# gracefully first.
|
|
self.context.logger.warning(
|
|
f"The disconnect request sent to the DAP server timed out after {dc_req_timeout}s; forcibly shutting down DAP server."
|
|
)
|
|
pass
|
|
self._proc.kill()
|
|
self._proc = None
|
|
self.message_logger._custom_exit()
|
|
|
|
# Waits for a response to the request with the given seq, optionally raising an error
|
|
# if the response takes too long (blocks forever by default/if timeout=0).
|
|
def _await_response(self, seq: int, timeout: float = 0.0) -> dict:
    """Poll until the response to request `seq` has been recorded, then return it.

    Raises TimeoutError once the `Timeout(timeout)` check reports that it has timed out. If the
    adapter process has exited by then, that is logged as an error first.
    """
    deadline = Timeout(timeout)
    while True:
        response = self._debugger_state.get_response(seq)
        if response is not None:
            return response
        if deadline.timed_out():
            exit_code = self._proc.poll()
            if exit_code is not None:
                self.context.logger.error(
                    f"Debug adapter exited while Dexter is awaiting response? Result: {exit_code}"
                )
            raise TimeoutError(
                f"Timed out while waiting for response to DAP request {seq}"
            )
        time.sleep(0.001)
|
|
|
|
## End of DAP communication methods
|
|
############################################################################
|
|
|
|
def _translate_stop_reason(self, reason):
    """Map a DAP stop-reason string onto a StopReason; None maps to None."""
    if reason is None:
        return None
    # Substring match: any reason that mentions "breakpoint" counts as a breakpoint stop.
    if "breakpoint" in reason:
        return StopReason.BREAKPOINT
    exact_matches = {
        "step": StopReason.STEP,
        "exited": StopReason.PROGRAM_EXIT,
        "terminated": StopReason.PROGRAM_EXIT,
        "exception": StopReason.ERROR,
    }
    return exact_matches.get(reason, StopReason.OTHER)
|
|
|
|
def _load_interface(self):
|
|
if not os.path.isfile(self._debug_adapter_executable):
|
|
raise LoadDebuggerException(
|
|
f'debug adapter "{self._debug_adapter_executable}" does not exist',
|
|
sys.exc_info(),
|
|
)
|
|
# We don't make use of _interface, so return nothing.
|
|
|
|
@property
@abc.abstractmethod
def version(self):
    """Return the version of this DAP debugger; concrete subclasses must provide it."""
|
|
|
|
############################################################################
|
|
## Breakpoint Methods
|
|
|
|
def get_next_bp_id(self):
    """Hand out the next unused Dexter breakpoint ID and advance the counter."""
    allocated = self.max_bp_id
    self.max_bp_id = allocated + 1
    return allocated
|
|
|
|
def get_current_bps(self, source):
    """Return the Dexter breakpoint IDs recorded for `source`, or a new empty list if none.

    The lookup never adds `source` to `file_to_bp`.
    """
    # dict.get() does not trigger a defaultdict's default factory, so no entry is created.
    return self.file_to_bp.get(source, [])
|
|
|
|
def _update_requested_bp_list(self, bp_list):
|
|
"""Can be overridden for any specific implementations that need further processing before sending breakpoints to
|
|
the debug adapter, e.g. in LLDB we cannot store multiple breakpoints at a single location, and therefore must
|
|
combine conditions for breakpoints at the same location."""
|
|
return bp_list
|
|
|
|
# For a source file, returns the list of BreakpointRequests for the breakpoints in that file, which can be sent to
|
|
# the debug adapter.
|
|
def _get_desired_bps(self, file: str):
    """Return the BreakpointRequests for the breakpoints currently recorded in `file`.

    The list is passed through `_update_requested_bp_list` before being returned, so it is
    ready to be sent to the debug adapter.
    """
    requests = []
    for dex_bp_id in self.get_current_bps(file):
        _, line, cond = self.bp_info[dex_bp_id]
        requests.append(DAP.BreakpointRequest(line, cond))
    return self._update_requested_bp_list(requests)
|
|
|
|
def clear_breakpoints(self):
    """Do nothing.

    Even if breakpoints were preserved between runs, old breakpoints are automatically cleared
    by the first 'setBreakpoints' message, so there is nothing to do here.
    """
    return None
|
|
|
|
def _add_breakpoint(self, file, line):
|
|
return self._add_conditional_breakpoint(file, line, None)
|
|
|
|
def add_function_breakpoint(self, name: str):
    """Record a breakpoint on function `name` and return its new Dexter breakpoint ID.

    The breakpoint is only marked as pending here. Raises DebuggerException if the debugger has
    not reported support for function breakpoints.
    """
    capabilities = self._debugger_state.capabilities
    if not capabilities.supportsFunctionBreakpoints:
        raise DebuggerException("Debugger does not support function breakpoints")
    bp_id = self.get_next_bp_id()
    self.function_bp_info[bp_id] = name
    self.pending_function_breakpoints = True
    return bp_id
|
|
|
|
def add_instruction_breakpoint(self, addr: str):
    """Record a breakpoint on instruction reference `addr` and return its new Dexter breakpoint ID.

    The breakpoint is only marked as pending here. Raises DebuggerException if the debugger has
    not reported support for instruction breakpoints.
    """
    capabilities = self._debugger_state.capabilities
    if not capabilities.supportsInstructionBreakpoints:
        raise DebuggerException("Debugger does not support instruction breakpoints")
    bp_id = self.get_next_bp_id()
    self.instruction_bp_info[bp_id] = addr
    self.pending_instruction_breakpoints = True
    return bp_id
|
|
|
|
def _add_conditional_breakpoint(self, file, line, condition):
|
|
new_id = self.get_next_bp_id()
|
|
self.file_to_bp[file].append(new_id)
|
|
self.bp_info[new_id] = (file, line, condition)
|
|
self.pending_breakpoints = True
|
|
return new_id
|
|
|
|
def _update_breakpoint_ids_after_request(self, dex_bp_ids: list, response: dict):
|
|
dap_bp_ids = [bp["id"] for bp in response["body"]["breakpoints"]]
|
|
if len(dex_bp_ids) != len(dap_bp_ids):
|
|
self.context.logger.error(
|
|
f"Sent request to set {len(dex_bp_ids)} breakpoints, but received {len(dap_bp_ids)} in response."
|
|
)
|
|
visited_dap_ids = set()
|
|
for i, dex_bp_id in enumerate(dex_bp_ids):
|
|
dap_bp_id = dap_bp_ids[i]
|
|
self.dex_id_to_dap_id[dex_bp_id] = dap_bp_id
|
|
# We take the mappings in the response as the canonical mapping, meaning that if the debug server has
|
|
# simply *changed* the DAP ID for a breakpoint we overwrite the existing mapping rather than adding to
|
|
# it, but if we receive the same DAP ID for multiple Dex IDs *then* we store a one-to-many mapping.
|
|
if dap_bp_id in visited_dap_ids:
|
|
self.dap_id_to_dex_ids[dap_bp_id].append(dex_bp_id)
|
|
else:
|
|
self.dap_id_to_dex_ids[dap_bp_id] = [dex_bp_id]
|
|
visited_dap_ids.add(dap_bp_id)
|
|
|
|
def _flush_breakpoints(self):
|
|
# Normal and conditional breakpoints.
|
|
if self.pending_breakpoints:
|
|
self.pending_breakpoints = False
|
|
for file in self.file_to_bp.keys():
|
|
desired_bps = self._get_desired_bps(file)
|
|
request_id = self.send_message(
|
|
self.make_set_breakpoint_request(file, desired_bps)
|
|
)
|
|
result = self._await_response(request_id, 10)
|
|
if not result["success"]:
|
|
raise DebuggerException(f"could not set breakpoints for '{file}'")
|
|
# The debug adapter may have chosen to merge our breakpoints. From here we need to identify such cases and
|
|
# handle them so that our internal bookkeeping is correct.
|
|
dex_bp_ids = self.get_current_bps(file)
|
|
self._update_breakpoint_ids_after_request(dex_bp_ids, result)
|
|
|
|
# Function breakpoints.
|
|
if self.pending_function_breakpoints:
|
|
self.pending_function_breakpoints = False
|
|
desired_bps = list(self.function_bp_info.values())
|
|
request_id = self.send_message(
|
|
self.make_set_function_breakpoint_request(desired_bps)
|
|
)
|
|
result = self._await_response(request_id, 10)
|
|
if not result["success"]:
|
|
raise DebuggerException(
|
|
f"could not set function breakpoints: '{desired_bps}'"
|
|
)
|
|
# We expect the breakpoint order to match in request and response.
|
|
dex_bp_ids = list(self.function_bp_info.keys())
|
|
self._update_breakpoint_ids_after_request(dex_bp_ids, result)
|
|
|
|
# Address / instruction breakpoints.
|
|
if self.pending_instruction_breakpoints:
|
|
self.pending_instruction_breakpoints = False
|
|
desired_bps = list(self.instruction_bp_info.values())
|
|
request_id = self.send_message(
|
|
self.make_set_instruction_breakpoint_request(desired_bps)
|
|
)
|
|
result = self._await_response(request_id, 10)
|
|
if not result["success"]:
|
|
raise DebuggerException(
|
|
f"could not set instruction breakpoints: '{desired_bps}'"
|
|
)
|
|
# We expect the breakpoint order to match in request and response.
|
|
dex_bp_ids = list(self.instruction_bp_info.keys())
|
|
self._update_breakpoint_ids_after_request(dex_bp_ids, result)
|
|
|
|
def _confirm_triggered_breakpoint_ids(self, dex_bp_ids):
|
|
"""Can be overridden for any specific implementations that need further processing from the debug server's
|
|
reported 'hitBreakpointIds', e.g. in LLDB where we the ID for every breakpoint at the current PC, even if some
|
|
are conditional and their condition is not met."""
|
|
return dex_bp_ids
|
|
|
|
def get_triggered_breakpoint_ids(self):
    """Return the set of Dexter breakpoint IDs responsible for the current stop.

    The set is empty unless the debuggee is stopped at a breakpoint. DAP IDs with no known
    Dexter mapping are ignored, and the result is passed through
    `_confirm_triggered_breakpoint_ids`.
    """
    # Breakpoints can only have been triggered if we've hit one.
    reason = self._translate_stop_reason(self._debugger_state.stopped_reason)
    if reason != StopReason.BREAKPOINT:
        return set()
    triggered = set()
    for dap_id in self._debugger_state.stopped_bps:
        triggered.update(self.dap_id_to_dex_ids.get(dap_id, ()))
    return self._confirm_triggered_breakpoint_ids(triggered)
|
|
|
|
def delete_breakpoints(self, ids):
    """Remove the breakpoints with the given Dexter IDs from the local bookkeeping.

    Nothing is sent to the adapter here; the affected breakpoint kinds are marked as pending.
    IDs that are not known are ignored.
    """
    doomed_by_file = defaultdict(list)
    for dex_bp_id in ids:
        if dex_bp_id in self.bp_info:
            # Source breakpoints are grouped per file and removed in one pass below.
            source = self.bp_info[dex_bp_id][0]
            doomed_by_file[source].append(dex_bp_id)
        elif dex_bp_id in self.function_bp_info:
            del self.function_bp_info[dex_bp_id]
            self.pending_function_breakpoints = True
        elif dex_bp_id in self.instruction_bp_info:
            del self.instruction_bp_info[dex_bp_id]
            self.pending_instruction_breakpoints = True

    for file, doomed in doomed_by_file.items():
        before = self.file_to_bp[file]
        after = [bp_id for bp_id in before if bp_id not in doomed]
        self.file_to_bp[file] = after
        # Only flag a change if something was actually removed from the active list.
        if len(after) != len(before):
            self.pending_breakpoints = True
|
|
|
|
## End of breakpoint methods
|
|
############################################################################
|
|
|
|
@classmethod
|
|
@abc.abstractmethod
|
|
def _get_launch_params(self, cmdline):
|
|
""" "Set the debugger-specific params used in a launch request."""
|
|
|
|
def launch(self, cmdline):
    """Launch the debuggee through the debug adapter and wait until it is running.

    The sequencing is mostly DAP-compliant while remaining compatible with lldb-dap:
      1. Send the launch request, without waiting for its response.
      2. Wait for the "initialized" event.
      3. Flush (set) breakpoints.
      4. Send configurationDone to allow the process to start running.
      5. Await the launch and configurationDone responses.
      6. Wait until the debugger state reports a launched process and a thread ID.

    Args:
        cmdline: Sequence of command-line tokens for the debuggee. It is not modified; any `target_run_args`
            from the options are appended to a copy.

    Raises:
        AssertionError: If no breakpoint has been set before launching, or if the configurationDone request is
            reported as unsuccessful.
        TimeoutError: If the "initialized" event is not observed before the initialization timeout expires.
        DebuggerException: If the adapter reports the launch request as unsuccessful.
    """
    # FIXME: Should this be a warning or exception, rather than assert?
    assert (
        len(self.file_to_bp)
        + len(self.function_bp_info)
        + len(self.instruction_bp_info)
        > 0
    ), "Expected at least one breakpoint before launching"

    if self.context.options.target_run_args:
        # Build a new list instead of using `+=`, which would extend the caller's list in place (and would
        # append the run args again if the same list were ever reused for another launch).
        cmdline = list(cmdline) + shlex.split(self.context.options.target_run_args)

    launch_request = self._get_launch_params(cmdline)

    # The launch request is sent first, but its response is only awaited after configurationDone has been sent:
    # a spec-compliant adapter does not act on (or respond to) the launch request until configuration is done,
    # whereas lldb-dap processes it straight away and tolerates configuration requests arriving in the meantime.
    launch_req_id = self.send_message(self.make_request("launch", launch_request))

    # Wait for the initialized event; for LLDB, this will be sent after the launch request has been processed;
    # for other debuggers, it will have been sent some time after the initialize response was sent.
    # NB: Per the spec the client should receive this event before it sends the launch request, but checking for
    # it here instead keeps us compatible with both orderings.
    # NB: In all current cases this timeout is never hit because the initialized event is received almost
    # immediately after either the initialize response or the launch request/response; if this starts being hit,
    # we probably need to parameterize this.
    initialize_timeout = Timeout(3)
    while not self._debugger_state.initialized:
        if initialize_timeout.timed_out():
            raise TimeoutError(
                "Timed out while waiting for initialized event from DAP"
            )
        time.sleep(0.001)

    # Set breakpoints after the initialized event has been received but before sending configurationDone.
    self._flush_breakpoints()

    # Send configurationDone to allow the process to start running.
    config_done_req_id = self.send_message(self.make_request("configurationDone"))

    launch_response = self._await_response(launch_req_id)
    if not launch_response["success"]:
        # `body`, `body.error` and `message` are all optional on a DAP error response, so fall back gracefully
        # rather than masking the launch failure with a KeyError.
        error_info = (launch_response.get("body") or {}).get("error") or {}
        failure_reason = (
            error_info.get("format")
            or launch_response.get("message")
            or "<unknown error>"
        )
        raise DebuggerException(f'failure launching debugger: "{failure_reason}"')
    config_done_response = self._await_response(config_done_req_id)
    assert config_done_response["success"], "configurationDone request failed"

    # Wait for the process to launch and obtain a thread ID.
    # NB: This wait is unbounded; it relies on the debugger state being updated once the adapter reports the
    # launched process and its thread.
    while self._debugger_state.thread is None or not self._debugger_state.launched:
        time.sleep(0.001)
|
|
|
|
# LLDB has unique stepping behaviour w.r.t. breakpoints that needs to be handled after completing a step, so we use
|
|
# an overridable hook to enable debugger-specific behaviour.
|
|
def _post_step_hook(self):
    """Debugger-specific hook run after a step request has completed.

    The base implementation does nothing and returns None; `_step` calls it once the debugger state no longer
    reports the debuggee as running.
    """
    return None
|
|
|
|
def _step(self, step_request_string):
    """Send a DAP step request for the current thread and block until the debuggee has stopped again.

    Args:
        step_request_string: The DAP command to send; the callers in this class pass "stepIn", "next" and
            "stepOut".

    Raises:
        DebuggerException: If the adapter reports the step request as unsuccessful.
    """
    # Breakpoints are flushed before every step request.
    self._flush_breakpoints()
    thread_args = {"threadId": self._debugger_state.thread}
    step_request = self.make_request(step_request_string, thread_args)
    step_response = self._await_response(self.send_message(step_request))
    if step_response["success"]:
        # The response only acknowledges the request; poll until the debugger state reports that the debuggee
        # is no longer running, then give the debugger-specific hook a chance to run.
        while self._debugger_state.is_running:
            time.sleep(0.001)
        self._post_step_hook()
        return
    raise DebuggerException(
        f"failed to perform debugger action: '{step_request_string}'"
    )
|
|
|
|
def step_in(self):
    """Step into the next call by issuing a DAP "stepIn" request through `_step`."""
    self._step("stepIn")
|
|
|
|
def step_next(self):
    """Step over the current line by issuing a DAP "next" request through `_step`."""
    self._step("next")
|
|
|
|
def step_out(self):
    """Step out of the current function by issuing a DAP "stepOut" request through `_step`."""
    self._step("stepOut")
|
|
|
|
def go(self) -> ReturnCode:
    """Resume the debuggee by sending a DAP "continue" request for the current thread.

    Breakpoints are flushed first, then the request is sent and its response awaited.

    Raises:
        DebuggerException: If the adapter reports the continue request as unsuccessful.
    """
    self._flush_breakpoints()
    thread_args = {"threadId": self._debugger_state.thread}
    continue_request = self.make_request("continue", thread_args)
    continue_response = self._await_response(self.send_message(continue_request))
    if not continue_response["success"]:
        raise DebuggerException("failed to continue")
    # A successful response only acknowledges the request: the debugger still has to send an event back
    # indicating that the debuggee has actually resumed.
    # NOTE(review): this method does not wait for that event itself, and it returns None despite the ReturnCode
    # annotation - confirm that callers account for both.
|
|
|
|
def _get_step_info(self, watches, step_index):
    """Build the StepIR describing the current stop from a DAP "stackTrace" request.

    Frames are collected from the top of the stack downwards. Collection stops at the first frame that has no
    source path, or whose function name contains one of the entries of `frames_below_main`. For every collected
    frame whose source path exists on disk, each watch that `watch_is_active` accepts for that frame is evaluated
    and stored under its expression.

    Args:
        watches: Iterable of watch descriptions; each is passed to `watch_is_active` and its `expression`
            attribute is evaluated.
        step_index: Index recorded in the returned StepIR.

    Returns:
        A StepIR holding the collected frames, the translated stop reason and the program state.

    Raises:
        AssertionError: If the debugger state reports that the debuggee is still running.
        DebuggerException: If the stackTrace request is reported as unsuccessful.
    """
    assert (
        not self._debugger_state.is_running
    ), "Cannot get step info while debugger is running!"

    trace_request = self.make_request(
        "stackTrace", {"threadId": self._debugger_state.thread}
    )
    trace_response = self._await_response(self.send_message(trace_request))
    if not trace_response["success"]:
        raise DebuggerException("failed to get stack frames")

    frames = []
    state_frames = []

    for frame_idx, dap_frame in enumerate(trace_response["body"]["stackFrames"]):
        # FIXME: No source, skip the frame! Currently this has only been observed for frames below main, so we
        # stop here; if it happens elsewhere, then this will break more stuff and needs a better solution.
        source = dap_frame.get("source")
        if source is None or source.get("path") is None:
            break

        loc_fields = {
            "path": source["path"],
            "lineno": dap_frame["line"],
            "column": dap_frame["column"],
        }
        loc = LocIR(**loc_fields)
        can_evaluate_watches = loc.path and os.path.exists(loc.path)

        raw_name = dap_frame["name"]
        frame = FrameIR(
            function=self._sanitize_function_name(raw_name),
            is_inlined=raw_name.startswith("[Inline Frame]"),
            loc=loc,
        )

        # Frames below "main" are not expected to be user code, so stop at the first one.
        function_name = frame.function or ""  # pylint: disable=no-member
        if any(marker in function_name for marker in self.frames_below_main):
            break

        frames.append(frame)

        state_frame = StackFrame(
            function=frame.function,
            is_inlined=frame.is_inlined,
            location=SourceLocation(**loc_fields),
            watches={},
        )
        if can_evaluate_watches:
            watch_path = loc.path
            watch_line = loc.lineno
            for watch_info in watches:
                # Skip watches that are not active in the current frame, and evaluate the ones that are.
                if not watch_is_active(watch_info, watch_path, frame_idx, watch_line):
                    continue
                value = self.evaluate_expression(watch_info.expression, frame_idx)
                state_frame.watches[value.expression] = value
        state_frames.append(state_frame)

    # A lone frame without a function name is treated as having no usable frames at all.
    if len(frames) == 1 and frames[0].function is None:
        frames = []
        state_frames = []

    stop_reason = self._translate_stop_reason(self._debugger_state.stopped_reason)

    return StepIR(
        step_index=step_index,
        frames=frames,
        stop_reason=stop_reason,
        program_state=ProgramState(state_frames),
    )
|
|
|
|
@property
def is_running(self):
    """The `is_running` flag of the tracked debugger state."""
    debugger_state = self._debugger_state
    return debugger_state.is_running
|
|
|
|
@property
def is_finished(self):
    """The `is_finished` flag of the tracked debugger state."""
    debugger_state = self._debugger_state
    return debugger_state.is_finished
|
|
|
|
@property
def frames_below_main(self):
    """Function-name fragments identifying stack frames below "main".

    `_get_step_info` stops collecting frames at the first frame whose function name contains one of these
    entries. The base implementation returns None, which cannot be iterated, so concrete debuggers are
    presumably expected to override this with an iterable of strings.
    """
    return None
|
|
|
|
@staticmethod
@abc.abstractmethod
def _evaluate_result_value(expression: str, result_string: str, type_string=None) -> ValueIR:
    """For the result of an "evaluate" message, return a ValueIR. Implementation must be debugger-specific.

    `evaluate_expression` calls this hook with three positional arguments, so the abstract declaration accepts
    the third one as well (defaulting to None so that two-argument calls remain valid).

    Args:
        expression: The expression that was evaluated.
        result_string: The result text reported by the adapter, or an error description if evaluation failed.
        type_string: The "type" field of the evaluate response body, or None when the adapter did not report
            one.
    """
|
|
|
|
def evaluate_expression(self, expression, frame_idx=0) -> ValueIR:
    """Evaluate `expression` in the given stack frame via a DAP "evaluate" request (context "watch").

    Args:
        expression: The expression text to evaluate.
        frame_idx: Index of the frame to evaluate in; it is translated to the adapter's frame ID through the
            debugger state's `frame_map`.

    Returns:
        The ValueIR produced by `_evaluate_result_value`. If the adapter reports failure, the result text handed
        to that hook is the adapter's error description instead of a value.
    """
    # The frame_idx passed in here needs to be translated to the debug adapter's internal frame ID.
    dap_frame_id = self._debugger_state.frame_map[frame_idx]
    eval_req_id = self.send_message(
        self.make_request(
            "evaluate",
            {
                "expression": expression,
                "frameId": dap_frame_id,
                "context": "watch",
            },
        )
    )
    eval_response = self._await_response(eval_req_id)

    # Both `body` and `message` are optional on a DAP response, so read them defensively: a failed evaluation
    # must yield an error description rather than a KeyError.
    body = eval_response.get("body") or {}
    if eval_response["success"]:
        result = body["result"]
    else:
        error_info = body.get("error") or {}
        result = (
            error_info.get("format")
            or eval_response.get("message")
            or "<unable to evaluate expression>"
        )
    # Always bind the type, so that it is defined (as None) when the adapter reports no type or the evaluation
    # failed.
    type_str = body.get("type")

    return self._evaluate_result_value(expression, result, type_str)
|