2022-08-19 15:59:36 +02:00
|
|
|
// Copyright (C) 2016 The Qt Company Ltd.
|
2022-12-21 10:12:09 +01:00
|
|
|
// SPDX-License-Identifier: LicenseRef-Qt-Commercial OR GPL-3.0-only WITH Qt-GPL-exception-1.0
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2017-09-21 12:35:24 +02:00
|
|
|
#include "textutils.h"
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2012-02-15 10:42:41 +01:00
|
|
|
#include <QTextDocument>
|
|
|
|
|
#include <QTextBlock>
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2023-05-09 13:49:57 +02:00
|
|
|
namespace Utils::Text {
|
|
|
|
|
|
|
|
|
|
bool Position::operator==(const Position &other) const
|
|
|
|
|
{
|
|
|
|
|
return line == other.line && column == other.column;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int Range::length(const QString &text) const
|
|
|
|
|
{
|
|
|
|
|
if (begin.line == end.line)
|
|
|
|
|
return end.column - begin.column;
|
|
|
|
|
|
|
|
|
|
const int lineCount = end.line - begin.line;
|
|
|
|
|
int index = text.indexOf(QChar::LineFeed);
|
|
|
|
|
int currentLine = 1;
|
|
|
|
|
while (index > 0 && currentLine < lineCount) {
|
|
|
|
|
++index;
|
|
|
|
|
index = text.indexOf(QChar::LineFeed, index);
|
|
|
|
|
++currentLine;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (index < 0)
|
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
|
|
return index - begin.column + end.column;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool Range::operator==(const Range &other) const
|
|
|
|
|
{
|
|
|
|
|
return begin == other.begin && end == other.end;
|
|
|
|
|
}
|
2011-04-15 16:19:23 +02:00
|
|
|
|
|
|
|
|
bool convertPosition(const QTextDocument *document, int pos, int *line, int *column)
|
|
|
|
|
{
|
|
|
|
|
QTextBlock block = document->findBlock(pos);
|
|
|
|
|
if (!block.isValid()) {
|
|
|
|
|
(*line) = -1;
|
|
|
|
|
(*column) = -1;
|
|
|
|
|
return false;
|
|
|
|
|
} else {
|
2018-09-25 16:19:41 +02:00
|
|
|
// line and column are both 1-based
|
2011-04-15 16:19:23 +02:00
|
|
|
(*line) = block.blockNumber() + 1;
|
2018-09-25 16:19:41 +02:00
|
|
|
(*column) = pos - block.position() + 1;
|
2011-04-15 16:19:23 +02:00
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
}
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2018-07-17 23:21:05 +03:00
|
|
|
OptionalLineColumn convertPosition(const QTextDocument *document, int pos)
|
2017-11-23 14:30:09 +01:00
|
|
|
{
|
2018-07-17 23:21:05 +03:00
|
|
|
OptionalLineColumn optional;
|
2017-11-23 14:30:09 +01:00
|
|
|
|
|
|
|
|
QTextBlock block = document->findBlock(pos);
|
|
|
|
|
|
|
|
|
|
if (block.isValid())
|
2023-05-09 14:08:41 +02:00
|
|
|
optional.emplace(block.blockNumber() + 1, pos - block.position());
|
2017-11-23 14:30:09 +01:00
|
|
|
|
|
|
|
|
return optional;
|
|
|
|
|
}
|
|
|
|
|
|
2018-07-13 12:33:46 +02:00
|
|
|
int positionInText(const QTextDocument *textDocument, int line, int column)
|
2018-06-15 14:33:01 +02:00
|
|
|
{
|
|
|
|
|
// Deduct 1 from line and column since they are 1-based.
|
|
|
|
|
// Column should already be converted from UTF-8 byte offset to the TextEditor column.
|
|
|
|
|
return textDocument->findBlockByNumber(line - 1).position() + column - 1;
|
|
|
|
|
}
|
|
|
|
|
|
2011-04-15 16:19:23 +02:00
|
|
|
QString textAt(QTextCursor tc, int pos, int length)
|
2010-09-24 20:16:34 +02:00
|
|
|
{
|
2011-04-15 16:19:23 +02:00
|
|
|
if (pos < 0)
|
|
|
|
|
pos = 0;
|
|
|
|
|
tc.movePosition(QTextCursor::End);
|
|
|
|
|
if (pos + length > tc.position())
|
|
|
|
|
length = tc.position() - pos;
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2011-04-15 16:19:23 +02:00
|
|
|
tc.setPosition(pos);
|
|
|
|
|
tc.setPosition(pos + length, QTextCursor::KeepAnchor);
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2014-03-22 20:24:55 +02:00
|
|
|
// selectedText() returns U+2029 (PARAGRAPH SEPARATOR) instead of newline
|
|
|
|
|
return tc.selectedText().replace(QChar::ParagraphSeparator, QLatin1Char('\n'));
|
2011-04-15 16:19:23 +02:00
|
|
|
}
|
2010-09-24 20:16:34 +02:00
|
|
|
|
2019-07-24 18:40:10 +02:00
|
|
|
QTextCursor selectAt(QTextCursor textCursor, int line, int column, uint length)
|
2016-08-04 15:26:53 +02:00
|
|
|
{
|
|
|
|
|
if (line < 1)
|
|
|
|
|
line = 1;
|
|
|
|
|
|
|
|
|
|
if (column < 1)
|
|
|
|
|
column = 1;
|
|
|
|
|
|
2021-09-29 09:18:04 +02:00
|
|
|
const int anchorPosition = positionInText(textCursor.document(), line, column);
|
2020-06-08 13:30:17 +02:00
|
|
|
textCursor.setPosition(anchorPosition);
|
2021-09-29 09:18:04 +02:00
|
|
|
textCursor.setPosition(anchorPosition + int(length), QTextCursor::KeepAnchor);
|
2016-08-04 15:26:53 +02:00
|
|
|
|
|
|
|
|
return textCursor;
|
|
|
|
|
}
|
|
|
|
|
|
2015-12-20 19:59:00 +01:00
|
|
|
QTextCursor flippedCursor(const QTextCursor &cursor)
|
|
|
|
|
{
|
|
|
|
|
QTextCursor flipped = cursor;
|
|
|
|
|
flipped.clearSelection();
|
|
|
|
|
flipped.setPosition(cursor.anchor(), QTextCursor::KeepAnchor);
|
|
|
|
|
return flipped;
|
|
|
|
|
}
|
|
|
|
|
|
2017-06-29 16:35:48 +02:00
|
|
|
static bool isValidIdentifierChar(const QChar &c)
|
|
|
|
|
{
|
|
|
|
|
return c.isLetter()
|
|
|
|
|
|| c.isNumber()
|
|
|
|
|
|| c == QLatin1Char('_')
|
|
|
|
|
|| c.isHighSurrogate()
|
|
|
|
|
|| c.isLowSurrogate();
|
|
|
|
|
}
|
|
|
|
|
|
2017-08-03 16:43:38 +02:00
|
|
|
static bool isAfterOperatorKeyword(QTextCursor cursor)
|
|
|
|
|
{
|
|
|
|
|
cursor.movePosition(QTextCursor::PreviousWord);
|
|
|
|
|
cursor.movePosition(QTextCursor::EndOfWord, QTextCursor::KeepAnchor);
|
|
|
|
|
return cursor.selectedText() == "operator";
|
|
|
|
|
}
|
|
|
|
|
|
2017-06-29 16:35:48 +02:00
|
|
|
QTextCursor wordStartCursor(const QTextCursor &textCursor)
|
|
|
|
|
{
|
|
|
|
|
const int originalPosition = textCursor.position();
|
|
|
|
|
QTextCursor cursor(textCursor);
|
|
|
|
|
cursor.movePosition(QTextCursor::StartOfWord);
|
|
|
|
|
const int wordStartPosition = cursor.position();
|
|
|
|
|
|
|
|
|
|
if (originalPosition == wordStartPosition) {
|
|
|
|
|
// Cursor is not on an identifier, check whether we are right after one.
|
|
|
|
|
const QChar c = textCursor.document()->characterAt(originalPosition - 1);
|
|
|
|
|
if (isValidIdentifierChar(c))
|
|
|
|
|
cursor.movePosition(QTextCursor::PreviousWord);
|
|
|
|
|
}
|
2017-08-03 16:43:38 +02:00
|
|
|
if (isAfterOperatorKeyword(cursor))
|
|
|
|
|
cursor.movePosition(QTextCursor::PreviousWord);
|
2017-06-29 16:35:48 +02:00
|
|
|
|
|
|
|
|
return cursor;
|
|
|
|
|
}
|
|
|
|
|
|
2019-02-12 13:08:46 +01:00
|
|
|
QString wordUnderCursor(const QTextCursor &cursor)
|
|
|
|
|
{
|
|
|
|
|
QTextCursor tc(cursor);
|
|
|
|
|
tc.select(QTextCursor::WordUnderCursor);
|
|
|
|
|
return tc.selectedText();
|
|
|
|
|
}
|
|
|
|
|
|
2018-10-11 14:11:43 +02:00
|
|
|
int utf8NthLineOffset(const QTextDocument *textDocument, const QByteArray &buffer, int line)
|
|
|
|
|
{
|
2018-12-11 09:40:50 +01:00
|
|
|
if (textDocument->blockCount() < line)
|
|
|
|
|
return -1;
|
|
|
|
|
|
2018-10-11 14:11:43 +02:00
|
|
|
if (textDocument->characterCount() == buffer.size() + 1)
|
|
|
|
|
return textDocument->findBlockByNumber(line - 1).position();
|
|
|
|
|
|
2018-10-17 11:00:24 +02:00
|
|
|
int utf8Offset = 0;
|
2018-10-11 14:11:43 +02:00
|
|
|
for (int count = 0; count < line - 1; ++count) {
|
2018-10-17 11:00:24 +02:00
|
|
|
utf8Offset = buffer.indexOf('\n', utf8Offset);
|
|
|
|
|
if (utf8Offset == -1)
|
|
|
|
|
return -1; // The line does not exist.
|
|
|
|
|
++utf8Offset;
|
2018-10-11 14:11:43 +02:00
|
|
|
}
|
2018-10-17 11:00:24 +02:00
|
|
|
return utf8Offset;
|
2018-10-11 14:11:43 +02:00
|
|
|
}
|
|
|
|
|
|
2019-02-19 14:30:52 +01:00
|
|
|
LineColumn utf16LineColumn(const QByteArray &utf8Buffer, int utf8Offset)
|
|
|
|
|
{
|
2022-05-24 13:45:35 +02:00
|
|
|
LineColumn lineColumn;
|
2019-02-19 14:30:52 +01:00
|
|
|
lineColumn.line = static_cast<int>(
|
|
|
|
|
std::count(utf8Buffer.begin(), utf8Buffer.begin() + utf8Offset, '\n'))
|
|
|
|
|
+ 1;
|
2019-03-06 13:04:34 +01:00
|
|
|
const int startOfLineOffset = utf8Offset ? (utf8Buffer.lastIndexOf('\n', utf8Offset - 1) + 1)
|
|
|
|
|
: 0;
|
2019-02-19 14:30:52 +01:00
|
|
|
lineColumn.column = QString::fromUtf8(
|
|
|
|
|
utf8Buffer.mid(startOfLineOffset, utf8Offset - startOfLineOffset))
|
2023-05-09 14:08:41 +02:00
|
|
|
.length();
|
2019-02-19 14:30:52 +01:00
|
|
|
return lineColumn;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
QString utf16LineTextInUtf8Buffer(const QByteArray &utf8Buffer, int currentUtf8Offset)
|
|
|
|
|
{
|
2019-03-06 13:04:34 +01:00
|
|
|
const int lineStartUtf8Offset = currentUtf8Offset
|
|
|
|
|
? (utf8Buffer.lastIndexOf('\n', currentUtf8Offset - 1) + 1)
|
|
|
|
|
: 0;
|
2019-02-19 14:30:52 +01:00
|
|
|
const int lineEndUtf8Offset = utf8Buffer.indexOf('\n', currentUtf8Offset);
|
|
|
|
|
return QString::fromUtf8(
|
|
|
|
|
utf8Buffer.mid(lineStartUtf8Offset, lineEndUtf8Offset - lineStartUtf8Offset));
|
|
|
|
|
}
|
|
|
|
|
|
2019-07-24 09:34:50 +02:00
|
|
|
static bool isByteOfMultiByteCodePoint(unsigned char byte)
|
|
|
|
|
{
|
|
|
|
|
return byte & 0x80; // Check if most significant bit is set
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool utf8AdvanceCodePoint(const char *¤t)
|
|
|
|
|
{
|
|
|
|
|
if (Q_UNLIKELY(*current == '\0'))
|
|
|
|
|
return false;
|
|
|
|
|
|
|
|
|
|
// Process multi-byte UTF-8 code point (non-latin1)
|
|
|
|
|
if (Q_UNLIKELY(isByteOfMultiByteCodePoint(*current))) {
|
|
|
|
|
unsigned trailingBytesCurrentCodePoint = 1;
|
|
|
|
|
for (unsigned char c = (*current) << 2; isByteOfMultiByteCodePoint(c); c <<= 1)
|
|
|
|
|
++trailingBytesCurrentCodePoint;
|
|
|
|
|
current += trailingBytesCurrentCodePoint + 1;
|
|
|
|
|
|
|
|
|
|
// Process single-byte UTF-8 code point (latin1)
|
|
|
|
|
} else {
|
|
|
|
|
++current;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2019-11-18 10:38:35 +01:00
|
|
|
void applyReplacements(QTextDocument *doc, const Replacements &replacements)
|
|
|
|
|
{
|
|
|
|
|
if (replacements.empty())
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
|
|
int fullOffsetShift = 0;
|
|
|
|
|
QTextCursor editCursor(doc);
|
|
|
|
|
editCursor.beginEditBlock();
|
2022-05-24 13:45:35 +02:00
|
|
|
for (const Text::Replacement &replacement : replacements) {
|
2019-11-18 10:38:35 +01:00
|
|
|
editCursor.setPosition(replacement.offset + fullOffsetShift);
|
|
|
|
|
editCursor.movePosition(QTextCursor::NextCharacter,
|
|
|
|
|
QTextCursor::KeepAnchor,
|
|
|
|
|
replacement.length);
|
|
|
|
|
editCursor.removeSelectedText();
|
|
|
|
|
editCursor.insertText(replacement.text);
|
|
|
|
|
fullOffsetShift += replacement.text.length() - replacement.length;
|
|
|
|
|
}
|
|
|
|
|
editCursor.endEditBlock();
|
|
|
|
|
}
|
|
|
|
|
|
2023-05-09 13:49:57 +02:00
|
|
|
} // namespace Utils::Text
|