Files
qt-creator/src/plugins/debugger/cdb/cdbparsehelpers.cpp
hjk 41df1fb2d3 debugger: rewrite parser for cli sub-breakpoint notifications
Change-Id: I971a2af2534bc650e8c604a5c2dc2e1846dbb045
Reviewed-on: http://codereview.qt.nokia.com/592
Reviewed-by: hjk <qthjk@ovi.com>
2011-06-22 12:23:46 +02:00

598 lines
21 KiB
C++

/**************************************************************************
**
** This file is part of Qt Creator
**
** Copyright (c) 2011 Nokia Corporation and/or its subsidiary(-ies).
**
** Contact: Nokia Corporation (info@qt.nokia.com)
**
**
** GNU Lesser General Public License Usage
**
** This file may be used under the terms of the GNU Lesser General Public
** License version 2.1 as published by the Free Software Foundation and
** appearing in the file LICENSE.LGPL included in the packaging of this file.
** Please review the following information to ensure the GNU Lesser General
** Public License version 2.1 requirements will be met:
** http://www.gnu.org/licenses/old-licenses/lgpl-2.1.html.
**
** In addition, as a special exception, Nokia gives you certain additional
** rights. These rights are described in the Nokia Qt LGPL Exception
** version 1.1, included in the file LGPL_EXCEPTION.txt in this package.
**
** Other Usage
**
** Alternatively, this file may be used in accordance with the terms and
** conditions contained in a signed written agreement between you and Nokia.
**
** If you have questions regarding the use of this file, please contact
** Nokia at info@qt.nokia.com.
**
**************************************************************************/
#include "cdbparsehelpers.h"
#include "breakpoint.h"
#include "threadshandler.h"
#include "registerhandler.h"
#include "bytearrayinputstream.h"
#include "gdb/gdbmi.h"
#include "disassemblerlines.h"
#ifdef Q_OS_WIN
# include "shared/dbgwinutils.h"
#endif
#include <utils/qtcassert.h>
#include <QtCore/QByteArray>
#include <QtCore/QVariant>
#include <QtCore/QString>
#include <QtCore/QDir>
#include <QtCore/QDebug>
#include <cctype>
enum { debugDisAsm = 0 };
namespace Debugger {
namespace Internal {
// Perform mapping on parts of the source tree as reported by/passed to debugger
// in case the user has specified such mappings in the global settings.
// That is, when debugging an executable built from 'X:\buildsrv\foo.cpp' and using a local
// source tree under 'c:\src', the user would specify a mapping 'X:\buildsrv'->'c:\src'
// and file names passed to breakpoints and reported stack traces can be converted.
QString cdbSourcePathMapping(QString fileName,
const QList<QPair<QString, QString> > &sourcePathMapping,
SourcePathMode mode)
{
typedef QPair<QString, QString> SourcePathMapping;
if (fileName.isEmpty() || sourcePathMapping.isEmpty())
return fileName;
foreach (const SourcePathMapping &m, sourcePathMapping) {
const QString &source = mode == DebuggerToSource ? m.first : m.second;
const int sourceSize = source.size();
// Map parts of the path and ensure a slash follows.
if (fileName.size() > sourceSize && fileName.startsWith(source, Qt::CaseInsensitive)) {
const QChar next = fileName.at(sourceSize);
if (next == QLatin1Char('\\') || next == QLatin1Char('/')) {
const QString &target = mode == DebuggerToSource ? m.second: m.first;
fileName.replace(0, sourceSize, target);
return fileName;
}
}
}
return fileName;
}
// Determine file name to be used for breakpoints. Convert to native and, unless short path
// is set, perform reverse lookup in the source path mappings.
static inline QString cdbBreakPointFileName(const BreakpointParameters &bp,
const QList<QPair<QString, QString> > &sourcePathMapping)
{
if (bp.fileName.isEmpty())
return bp.fileName;
if (bp.pathUsage == BreakpointUseShortPath)
return QFileInfo(bp.fileName).fileName();
return cdbSourcePathMapping(QDir::toNativeSeparators(bp.fileName), sourcePathMapping, SourceToDebugger);
}
static BreakpointParameters fixWinMSVCBreakpoint(const BreakpointParameters &p)
{
switch (p.type) {
case UnknownType:
case BreakpointByFileAndLine:
case BreakpointByFunction:
case BreakpointByAddress:
case BreakpointAtFork:
case WatchpointAtExpression:
case BreakpointAtSysCall:
case WatchpointAtAddress:
break;
case BreakpointAtExec: { // Emulate by breaking on CreateProcessW().
BreakpointParameters rc(BreakpointByFunction);
rc.module = QLatin1String("kernel32");
rc.functionName = QLatin1String("CreateProcessW");
return rc;
}
case BreakpointAtThrow: {
BreakpointParameters rc(BreakpointByFunction);
rc.functionName = QLatin1String("CxxThrowException"); // MSVC runtime. Potentially ambiguous.
return rc;
}
case BreakpointAtCatch: {
BreakpointParameters rc(BreakpointByFunction);
rc.functionName = QLatin1String("__CxxCallCatchBlock"); // MSVC runtime. Potentially ambiguous.
return rc;
}
case BreakpointAtMain: {
BreakpointParameters rc(BreakpointByFunction);
rc.functionName = QLatin1String("main");
return rc;
}
} // switch
return p;
}
QByteArray cdbAddBreakpointCommand(const BreakpointParameters &bpIn,
const QList<QPair<QString, QString> > &sourcePathMapping,
BreakpointId id /* = BreakpointId() */,
bool oneshot)
{
const BreakpointParameters bp = fixWinMSVCBreakpoint(bpIn);
QByteArray rc;
ByteArrayInputStream str(rc);
if (bp.threadSpec >= 0)
str << '~' << bp.threadSpec << ' ';
// Currently use 'bu' so that the offset expression (including file name)
// is kept when reporting back breakpoints (which is otherwise discarded
// when resolving).
str << (bp.type == WatchpointAtAddress ? "ba" : "bu");
if (id.isValid())
str << id.toString();
str << ' ';
if (oneshot)
str << "/1 ";
switch (bp.type) {
case BreakpointAtFork:
case BreakpointAtExec:
case WatchpointAtExpression:
case BreakpointAtSysCall:
case UnknownType:
case BreakpointAtCatch:
case BreakpointAtThrow:
case BreakpointAtMain:
QTC_ASSERT(false, return QByteArray(); )
break;
case BreakpointByAddress:
str << hex << hexPrefixOn << bp.address << hexPrefixOff << dec;
break;
case BreakpointByFunction:
if (!bp.module.isEmpty())
str << bp.module << '!';
str << bp.functionName;
break;
case BreakpointByFileAndLine:
str << '`';
if (!bp.module.isEmpty())
str << bp.module << '!';
str << cdbBreakPointFileName(bp, sourcePathMapping) << ':' << bp.lineNumber << '`';
break;
case WatchpointAtAddress: { // Read/write, no space here
const unsigned size = bp.size ? bp.size : 1;
str << "r" << size << ' ' << hex << hexPrefixOn << bp.address << hexPrefixOff << dec;
}
break;
}
if (bp.ignoreCount)
str << ' ' << (bp.ignoreCount + 1);
// Condition currently unsupported.
if (!bp.command.isEmpty())
str << " \"" << bp.command << '"';
return rc;
}
// Fix a CDB integer value: '00000000`0012a290' -> '12a290', '0n10' ->'10'
QByteArray fixCdbIntegerValue(QByteArray t, bool stripLeadingZeros, int *basePtr /* = 0 */)
{
if (t.isEmpty())
return t;
int base = 16;
// Prefixes
if (t.startsWith("0x")) {
t.remove(0, 2);
} else if (t.startsWith("0n")) {
base = 10;
t.remove(0, 2);
}
if (base == 16 && t.size() >= 9 && t.at(8) == '`')
t.remove(8, 1);
if (stripLeadingZeros) { // Strip all but last '0'
const int last = t.size() - 1;
int pos = 0;
for ( ; pos < last && t.at(pos) == '0'; pos++) ;
if (pos)
t.remove(0, pos);
}
if (basePtr)
*basePtr = base;
return t;
}
// Convert a CDB integer value: '00000000`0012a290' -> '12a290', '0n10' ->'10'
QVariant cdbIntegerValue(const QByteArray &t)
{
int base;
const QByteArray fixed = fixCdbIntegerValue(t, false, &base);
bool ok;
const QVariant converted = base == 16 ?
fixed.toULongLong(&ok, base) :
fixed.toLongLong(&ok, base);
QTC_ASSERT(ok, return QVariant(); )
return converted;
}
/* \code
0:002> ~ [Debugger-Id] Id: <hex pid> <hex tid> Suspends count thread environment block add state name
0 Id: 133c.1374 Suspend: 1 Teb: 000007ff`fffdd000 Unfrozen
. 2 Id: 133c.1160 Suspend: 1 Teb: 000007ff`fffd9000 Unfrozen "QThread"
3 Id: 133c.38c Suspend: 1 Teb: 000007ff`fffd7000 Unfrozen "QThread"
\endcode */
static inline bool parseThread(QByteArray line, ThreadData *thread, bool *current)
{
*current = false;
if (line.size() < 5)
return false;
*current = line.at(0) == '.';
if (current)
line[0] = ' ';
const QList<QByteArray> tokens = simplify(line).split(' ');
if (tokens.size() < 8 || tokens.at(1) != "Id:")
return false;
switch (tokens.size()) { // fallthru intended
case 9:
thread->name = QString::fromLocal8Bit(tokens.at(8));
case 8:
thread->state = QString::fromLocal8Bit(tokens.at(7));
case 3: {
const QByteArray &pidTid = tokens.at(2);
const int dotPos = pidTid.indexOf('.');
if (dotPos != -1)
thread->targetId = QLatin1String("0x") + QString::fromAscii(pidTid.mid(dotPos + 1));
}
case 1:
thread->id = tokens.at(0).toInt();
break;
} // switch size
return true;
}
// Helper to retrieve an int child from GDBMI
static inline bool gdbmiChildToInt(const GdbMi &parent, const char *childName, int *target)
{
const GdbMi childBA = parent.findChild(childName);
if (childBA.isValid()) {
bool ok;
const int v = childBA.data().toInt(&ok);
if (ok) {
*target = v;
return true;
}
}
return false;
}
// Helper to retrieve an bool child from GDBMI
static inline bool gdbmiChildToBool(const GdbMi &parent, const char *childName, bool *target)
{
const GdbMi childBA = parent.findChild(childName);
if (childBA.isValid()) {
*target = childBA.data() == "true";
return true;
}
return false;
}
// Parse extension command listing breakpoints.
// Note that not all fields are returned, since file, line, function are encoded
// in the expression (that is in addition deleted on resolving for a bp-type breakpoint).
BreakpointId parseBreakPoint(const GdbMi &gdbmi, BreakpointResponse *r,
QString *expression /* = 0 */)
{
BreakpointId id = BreakpointId(-1);
int majorPart = 0;
gdbmiChildToInt(gdbmi, "number", &majorPart);
gdbmiChildToBool(gdbmi, "enabled", &(r->enabled));
gdbmiChildToBool(gdbmi, "deferred", &(r->pending));
r->id = BreakpointId(majorPart);
const GdbMi idG = gdbmi.findChild("id");
if (idG.isValid()) { // Might not be valid if there is not id
bool ok;
const BreakpointId cid(idG.data().toInt(&ok));
if (ok)
id = cid;
}
const GdbMi moduleG = gdbmi.findChild("module");
if (moduleG.isValid())
r->module = QString::fromLocal8Bit(moduleG.data());
if (expression) {
const GdbMi expressionG = gdbmi.findChild("expression");
if (expressionG.isValid())
*expression = QString::fromLocal8Bit(expressionG.data());
}
const GdbMi addressG = gdbmi.findChild("address");
if (addressG.isValid())
r->address = addressG.data().toULongLong(0, 0);
if (gdbmiChildToInt(gdbmi, "passcount", &(r->ignoreCount)))
r->ignoreCount--;
gdbmiChildToInt(gdbmi, "thread", &(r->threadSpec));
return id;
}
QByteArray cdbWriteMemoryCommand(quint64 addr, const QByteArray &data)
{
QByteArray cmd;
ByteArrayInputStream str(cmd);
str.setIntegerBase(16);
str << "f " << addr << " L" << data.size();
const int count = data.size();
for (int i = 0 ; i < count ; i++ ) {
const unsigned char uc = (unsigned char)data.at(i);
str << ' ' << unsigned(uc);
}
return cmd;
}
QString debugByteArray(const QByteArray &a)
{
QString rc;
const int size = a.size();
rc.reserve(size * 2);
QTextStream str(&rc);
for (int i = 0; i < size; i++) {
const unsigned char uc = (unsigned char)(a.at(i));
switch (uc) {
case 0:
str << "\\0";
break;
case '\n':
str << "\\n";
break;
case '\t':
str << "\\t";
break;
case '\r':
str << "\\r";
break;
default:
if (uc >=32 && uc < 128) {
str << a.at(i);
} else {
str << '<' << unsigned(uc) << '>';
}
break;
}
}
return rc;
}
QString StringFromBase64EncodedUtf16(const QByteArray &a)
{
QByteArray utf16 = QByteArray::fromBase64(a);
utf16.append('\0');
utf16.append('\0');
return QString::fromUtf16(reinterpret_cast<const unsigned short *>(utf16.constData()));
}
WinException::WinException() :
exceptionCode(0), exceptionFlags(0), exceptionAddress(0),
info1(0),info2(0), firstChance(false), lineNumber(0)
{
}
void WinException::fromGdbMI(const GdbMi &gdbmi)
{
exceptionCode = gdbmi.findChild("exceptionCode").data().toUInt();
exceptionFlags = gdbmi.findChild("exceptionFlags").data().toUInt();
exceptionAddress = gdbmi.findChild("exceptionAddress").data().toULongLong();
firstChance = gdbmi.findChild("firstChance").data() != "0";
const GdbMi ginfo1 = gdbmi.findChild("exceptionInformation0");
if (ginfo1.isValid()) {
info1 = ginfo1.data().toULongLong();
const GdbMi ginfo2 = gdbmi.findChild("exceptionInformation1");
if (ginfo2.isValid())
info2 = ginfo1.data().toULongLong();
}
const GdbMi gLineNumber = gdbmi.findChild("exceptionLine");
if (gLineNumber.isValid()) {
lineNumber = gLineNumber.data().toInt();
file = gdbmi.findChild("exceptionFile").data();
}
function = gdbmi.findChild("exceptionFunction").data();
}
QString WinException::toString(bool includeLocation) const
{
QString rc;
QTextStream str(&rc);
#ifdef Q_OS_WIN
formatWindowsException(exceptionCode, exceptionAddress,
exceptionFlags, info1, info2, str);
#endif
if (includeLocation) {
if (lineNumber) {
str << " at " << QLatin1String(file) << ':' << lineNumber;
} else {
if (!function.isEmpty())
str << " in " << QLatin1String(function);
}
}
return rc;
}
QDebug operator<<(QDebug s, const WinException &e)
{
QDebug nsp = s.nospace();
nsp << "code=" << e.exceptionCode << ",flags=" << e.exceptionFlags
<< ",address=0x" << QString::number(e.exceptionAddress, 16)
<< ",firstChance=" << e.firstChance;
return s;
}
/*!
\fn DisassemblerLines parseCdbDisassembler(const QList<QByteArray> &a)
\brief Parse CDB disassembler output into DisassemblerLines (with helpers)
Expected options (prepend source file line):
\code
.asm source_line
.lines
\endcode
should cause the 'u' command to produce:
\code
gitgui!Foo::MainWindow::on_actionPtrs_triggered+0x1f9 [c:\qt\projects\gitgui\app\mainwindow.cpp @ 758]:
225 00000001`3fcebfe9 488b842410050000 mov rax,qword ptr [rsp+510h]
225 00000001`3fcebff1 8b4030 mov eax,dword ptr [rax+30h]
226 00000001`3fcebff4 ffc0 inc eax
00000001`3fcebff6 488b8c2410050000 mov rcx,qword ptr [rsp+510h]
...
QtCored4!QTextStreamPrivate::putString+0x34:
10 00000000`6e5e7f64 90 nop
...
\endcode
The algorithm checks for a function line and grabs the function name, offset and (optional)
source file from it.
Instruction lines are checked for address and source line number.
When the source line changes, the source instruction is inserted.
*/
// Parse a function header line: Match: 'nsp::foo+0x<offset> [<file> @ <line>]:'
// or 'nsp::foo+0x<offset>:', 'nsp::foo [<file> @ <line>]:'
// Do not use regexp here as it is hard for functions like operator+, operator[].
bool parseCdbDisassemblerFunctionLine(const QString &l,
QString *currentFunction, quint64 *functionOffset,
QString *sourceFile)
{
if (l.isEmpty() || !l.endsWith(QLatin1Char(':')) || l.at(0).isDigit() || l.at(0).isSpace())
return false;
int functionEnd = l.indexOf(QLatin1Char(' '));
if (functionEnd < 0)
functionEnd = l.size() - 1; // Nothing at all, just ':'
const int offsetPos = l.indexOf(QLatin1String("+0x"));
if (offsetPos > 0) {
*currentFunction = l.left(offsetPos);
*functionOffset = l.mid(offsetPos + 3, functionEnd - offsetPos - 3).trimmed().toULongLong(0, 16);
} else { // No offset, directly at beginning.
*currentFunction = l.left(functionEnd);
*functionOffset = 0;
}
sourceFile->clear();
// Parse file and line.
const int filePos = l.indexOf(QLatin1Char('['), functionEnd);
if (filePos == -1)
return true; // No file
const int linePos = l.indexOf(QLatin1String(" @ "), filePos + 1);
if (linePos == -1)
return false;
*sourceFile = l.mid(filePos + 1, linePos - filePos - 1).trimmed();
if (debugDisAsm)
qDebug() << "Function with source: " << l << currentFunction
<< functionOffset << sourceFile;
return true;
}
// Parse an instruction line:
// ' 21 00000001`3fcebff1 8b4030 mov eax,dword ptr [rax+30h]'
// '<source_line> <address> <raw data> <instruction>
bool parseCdbDisassemblerLine(const QString &lineIn, DisassemblerLine *dLine, uint *sourceLine)
{
*sourceLine = 0;
if (lineIn.size() < 6)
return false;
// Check source line: right-padded 5 digits
const bool hasSourceLine = lineIn.at(4).isDigit();
const QString line = lineIn.trimmed();
int addressPos = 0;
const QChar blank = QLatin1Char(' ');
// Optional source line.
if (hasSourceLine) {
const int sourceLineEnd = line.indexOf(blank);
if (sourceLineEnd == -1)
return false;
*sourceLine = line.left(sourceLineEnd).toUInt();
addressPos = sourceLineEnd + 1;
}
// Find positions of address/raw data/instruction
const int addressEnd = line.indexOf(blank, addressPos + 1);
if (addressEnd < 0)
return false;
const int rawDataPos = addressEnd + 1;
const int rawDataEnd = line.indexOf(blank, rawDataPos + 1);
if (rawDataEnd < 0)
return false;
const int instructionPos = rawDataEnd + 1;
bool ok;
QString addressS = line.mid(addressPos, addressEnd - addressPos);
if (addressS.size() > 9 && addressS.at(8) == QLatin1Char('`'))
addressS.remove(8, 1);
dLine->address = addressS.toULongLong(&ok, 16);
if (!ok)
return false;
dLine->rawData = QByteArray::fromHex(line.mid(rawDataPos, rawDataEnd - rawDataPos).toAscii());
dLine->data = line.right(line.size() - instructionPos).trimmed();
return true;
}
DisassemblerLines parseCdbDisassembler(const QList<QByteArray> &a)
{
DisassemblerLines result;
quint64 functionAddress = 0;
uint lastSourceLine = 0;
QString currentFunction;
quint64 functionOffset = 0;
QString sourceFile;
foreach (const QByteArray &lineBA, a) {
const QString line = QString::fromLatin1(lineBA);
// New function. Append as comment line.
if (parseCdbDisassemblerFunctionLine(line, &currentFunction, &functionOffset, &sourceFile)) {
functionAddress = 0;
DisassemblerLine commentLine;
commentLine.data = line;
result.appendLine(commentLine);
} else {
DisassemblerLine disassemblyLine;
uint sourceLine;
if (parseCdbDisassemblerLine(line, &disassemblyLine, &sourceLine)) {
// New source line: Add source code if available.
if (sourceLine && sourceLine != lastSourceLine) {
lastSourceLine = sourceLine;
result.appendSourceLine(sourceFile, sourceLine);
}
} else {
qWarning("Unable to parse assembly line '%s'", lineBA.constData());
disassemblyLine.fromString(line);
}
// Determine address of function from the first assembler line after a
// function header line.
if (!functionAddress && disassemblyLine.address) {
functionAddress = disassemblyLine.address - functionOffset;
}
if (functionAddress && disassemblyLine.address)
disassemblyLine.offset = disassemblyLine.address - functionAddress;
disassemblyLine.function = currentFunction;
result.appendLine(disassemblyLine);
}
}
return result;
}
} // namespace Internal
} // namespace Debugger