481 lines
14 KiB
C++
481 lines
14 KiB
C++
//===- EditedSource.cpp - Collection of source edits ----------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "clang/Edit/EditedSource.h"
|
|
#include "clang/Basic/CharInfo.h"
|
|
#include "clang/Basic/LLVM.h"
|
|
#include "clang/Basic/SourceLocation.h"
|
|
#include "clang/Basic/SourceManager.h"
|
|
#include "clang/Edit/Commit.h"
|
|
#include "clang/Edit/EditsReceiver.h"
|
|
#include "clang/Edit/FileOffset.h"
|
|
#include "clang/Lex/Lexer.h"
|
|
#include "llvm/ADT/STLExtras.h"
|
|
#include "llvm/ADT/SmallString.h"
|
|
#include "llvm/ADT/StringRef.h"
|
|
#include "llvm/ADT/Twine.h"
|
|
#include <algorithm>
|
|
#include <cassert>
|
|
#include <tuple>
|
|
#include <utility>
|
|
|
|
using namespace clang;
|
|
using namespace edit;
|
|
|
|
void EditsReceiver::remove(CharSourceRange range) {
|
|
replace(range, StringRef());
|
|
}
|
|
|
|
void EditedSource::deconstructMacroArgLoc(SourceLocation Loc,
|
|
SourceLocation &ExpansionLoc,
|
|
MacroArgUse &ArgUse) {
|
|
assert(SourceMgr.isMacroArgExpansion(Loc));
|
|
SourceLocation DefArgLoc =
|
|
SourceMgr.getImmediateExpansionRange(Loc).getBegin();
|
|
SourceLocation ImmediateExpansionLoc =
|
|
SourceMgr.getImmediateExpansionRange(DefArgLoc).getBegin();
|
|
ExpansionLoc = ImmediateExpansionLoc;
|
|
while (SourceMgr.isMacroBodyExpansion(ExpansionLoc))
|
|
ExpansionLoc =
|
|
SourceMgr.getImmediateExpansionRange(ExpansionLoc).getBegin();
|
|
SmallString<20> Buf;
|
|
StringRef ArgName = Lexer::getSpelling(SourceMgr.getSpellingLoc(DefArgLoc),
|
|
Buf, SourceMgr, LangOpts);
|
|
ArgUse = MacroArgUse{nullptr, SourceLocation(), SourceLocation()};
|
|
if (!ArgName.empty())
|
|
ArgUse = {&IdentTable.get(ArgName), ImmediateExpansionLoc,
|
|
SourceMgr.getSpellingLoc(DefArgLoc)};
|
|
}
|
|
|
|
void EditedSource::startingCommit() {}
|
|
|
|
void EditedSource::finishedCommit() {
|
|
for (auto &ExpArg : CurrCommitMacroArgExps) {
|
|
SourceLocation ExpLoc;
|
|
MacroArgUse ArgUse;
|
|
std::tie(ExpLoc, ArgUse) = ExpArg;
|
|
auto &ArgUses = ExpansionToArgMap[ExpLoc];
|
|
if (llvm::find(ArgUses, ArgUse) == ArgUses.end())
|
|
ArgUses.push_back(ArgUse);
|
|
}
|
|
CurrCommitMacroArgExps.clear();
|
|
}
|
|
|
|
StringRef EditedSource::copyString(const Twine &twine) {
|
|
SmallString<128> Data;
|
|
return copyString(twine.toStringRef(Data));
|
|
}
|
|
|
|
bool EditedSource::canInsertInOffset(SourceLocation OrigLoc, FileOffset Offs) {
|
|
FileEditsTy::iterator FA = getActionForOffset(Offs);
|
|
if (FA != FileEdits.end()) {
|
|
if (FA->first != Offs)
|
|
return false; // position has been removed.
|
|
}
|
|
|
|
if (SourceMgr.isMacroArgExpansion(OrigLoc)) {
|
|
SourceLocation ExpLoc;
|
|
MacroArgUse ArgUse;
|
|
deconstructMacroArgLoc(OrigLoc, ExpLoc, ArgUse);
|
|
auto I = ExpansionToArgMap.find(ExpLoc);
|
|
if (I != ExpansionToArgMap.end() &&
|
|
find_if(I->second, [&](const MacroArgUse &U) {
|
|
return ArgUse.Identifier == U.Identifier &&
|
|
std::tie(ArgUse.ImmediateExpansionLoc, ArgUse.UseLoc) !=
|
|
std::tie(U.ImmediateExpansionLoc, U.UseLoc);
|
|
}) != I->second.end()) {
|
|
// Trying to write in a macro argument input that has already been
|
|
// written by a previous commit for another expansion of the same macro
|
|
// argument name. For example:
|
|
//
|
|
// \code
|
|
// #define MAC(x) ((x)+(x))
|
|
// MAC(a)
|
|
// \endcode
|
|
//
|
|
// A commit modified the macro argument 'a' due to the first '(x)'
|
|
// expansion inside the macro definition, and a subsequent commit tried
|
|
// to modify 'a' again for the second '(x)' expansion. The edits of the
|
|
// second commit will be rejected.
|
|
return false;
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
bool EditedSource::commitInsert(SourceLocation OrigLoc,
|
|
FileOffset Offs, StringRef text,
|
|
bool beforePreviousInsertions) {
|
|
if (!canInsertInOffset(OrigLoc, Offs))
|
|
return false;
|
|
if (text.empty())
|
|
return true;
|
|
|
|
if (SourceMgr.isMacroArgExpansion(OrigLoc)) {
|
|
MacroArgUse ArgUse;
|
|
SourceLocation ExpLoc;
|
|
deconstructMacroArgLoc(OrigLoc, ExpLoc, ArgUse);
|
|
if (ArgUse.Identifier)
|
|
CurrCommitMacroArgExps.emplace_back(ExpLoc, ArgUse);
|
|
}
|
|
|
|
FileEdit &FA = FileEdits[Offs];
|
|
if (FA.Text.empty()) {
|
|
FA.Text = copyString(text);
|
|
return true;
|
|
}
|
|
|
|
if (beforePreviousInsertions)
|
|
FA.Text = copyString(Twine(text) + FA.Text);
|
|
else
|
|
FA.Text = copyString(Twine(FA.Text) + text);
|
|
|
|
return true;
|
|
}
|
|
|
|
bool EditedSource::commitInsertFromRange(SourceLocation OrigLoc,
|
|
FileOffset Offs,
|
|
FileOffset InsertFromRangeOffs, unsigned Len,
|
|
bool beforePreviousInsertions) {
|
|
if (Len == 0)
|
|
return true;
|
|
|
|
SmallString<128> StrVec;
|
|
FileOffset BeginOffs = InsertFromRangeOffs;
|
|
FileOffset EndOffs = BeginOffs.getWithOffset(Len);
|
|
FileEditsTy::iterator I = FileEdits.upper_bound(BeginOffs);
|
|
if (I != FileEdits.begin())
|
|
--I;
|
|
|
|
for (; I != FileEdits.end(); ++I) {
|
|
FileEdit &FA = I->second;
|
|
FileOffset B = I->first;
|
|
FileOffset E = B.getWithOffset(FA.RemoveLen);
|
|
|
|
if (BeginOffs == B)
|
|
break;
|
|
|
|
if (BeginOffs < E) {
|
|
if (BeginOffs > B) {
|
|
BeginOffs = E;
|
|
++I;
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
for (; I != FileEdits.end() && EndOffs > I->first; ++I) {
|
|
FileEdit &FA = I->second;
|
|
FileOffset B = I->first;
|
|
FileOffset E = B.getWithOffset(FA.RemoveLen);
|
|
|
|
if (BeginOffs < B) {
|
|
bool Invalid = false;
|
|
StringRef text = getSourceText(BeginOffs, B, Invalid);
|
|
if (Invalid)
|
|
return false;
|
|
StrVec += text;
|
|
}
|
|
StrVec += FA.Text;
|
|
BeginOffs = E;
|
|
}
|
|
|
|
if (BeginOffs < EndOffs) {
|
|
bool Invalid = false;
|
|
StringRef text = getSourceText(BeginOffs, EndOffs, Invalid);
|
|
if (Invalid)
|
|
return false;
|
|
StrVec += text;
|
|
}
|
|
|
|
return commitInsert(OrigLoc, Offs, StrVec, beforePreviousInsertions);
|
|
}
|
|
|
|
void EditedSource::commitRemove(SourceLocation OrigLoc,
|
|
FileOffset BeginOffs, unsigned Len) {
|
|
if (Len == 0)
|
|
return;
|
|
|
|
FileOffset EndOffs = BeginOffs.getWithOffset(Len);
|
|
FileEditsTy::iterator I = FileEdits.upper_bound(BeginOffs);
|
|
if (I != FileEdits.begin())
|
|
--I;
|
|
|
|
for (; I != FileEdits.end(); ++I) {
|
|
FileEdit &FA = I->second;
|
|
FileOffset B = I->first;
|
|
FileOffset E = B.getWithOffset(FA.RemoveLen);
|
|
|
|
if (BeginOffs < E)
|
|
break;
|
|
}
|
|
|
|
FileOffset TopBegin, TopEnd;
|
|
FileEdit *TopFA = nullptr;
|
|
|
|
if (I == FileEdits.end()) {
|
|
FileEditsTy::iterator
|
|
NewI = FileEdits.insert(I, std::make_pair(BeginOffs, FileEdit()));
|
|
NewI->second.RemoveLen = Len;
|
|
return;
|
|
}
|
|
|
|
FileEdit &FA = I->second;
|
|
FileOffset B = I->first;
|
|
FileOffset E = B.getWithOffset(FA.RemoveLen);
|
|
if (BeginOffs < B) {
|
|
FileEditsTy::iterator
|
|
NewI = FileEdits.insert(I, std::make_pair(BeginOffs, FileEdit()));
|
|
TopBegin = BeginOffs;
|
|
TopEnd = EndOffs;
|
|
TopFA = &NewI->second;
|
|
TopFA->RemoveLen = Len;
|
|
} else {
|
|
TopBegin = B;
|
|
TopEnd = E;
|
|
TopFA = &I->second;
|
|
if (TopEnd >= EndOffs)
|
|
return;
|
|
unsigned diff = EndOffs.getOffset() - TopEnd.getOffset();
|
|
TopEnd = EndOffs;
|
|
TopFA->RemoveLen += diff;
|
|
if (B == BeginOffs)
|
|
TopFA->Text = StringRef();
|
|
++I;
|
|
}
|
|
|
|
while (I != FileEdits.end()) {
|
|
FileEdit &FA = I->second;
|
|
FileOffset B = I->first;
|
|
FileOffset E = B.getWithOffset(FA.RemoveLen);
|
|
|
|
if (B >= TopEnd)
|
|
break;
|
|
|
|
if (E <= TopEnd) {
|
|
FileEdits.erase(I++);
|
|
continue;
|
|
}
|
|
|
|
if (B < TopEnd) {
|
|
unsigned diff = E.getOffset() - TopEnd.getOffset();
|
|
TopEnd = E;
|
|
TopFA->RemoveLen += diff;
|
|
FileEdits.erase(I);
|
|
}
|
|
|
|
break;
|
|
}
|
|
}
|
|
|
|
bool EditedSource::commit(const Commit &commit) {
|
|
if (!commit.isCommitable())
|
|
return false;
|
|
|
|
struct CommitRAII {
|
|
EditedSource &Editor;
|
|
|
|
CommitRAII(EditedSource &Editor) : Editor(Editor) {
|
|
Editor.startingCommit();
|
|
}
|
|
|
|
~CommitRAII() {
|
|
Editor.finishedCommit();
|
|
}
|
|
} CommitRAII(*this);
|
|
|
|
for (edit::Commit::edit_iterator
|
|
I = commit.edit_begin(), E = commit.edit_end(); I != E; ++I) {
|
|
const edit::Commit::Edit &edit = *I;
|
|
switch (edit.Kind) {
|
|
case edit::Commit::Act_Insert:
|
|
commitInsert(edit.OrigLoc, edit.Offset, edit.Text, edit.BeforePrev);
|
|
break;
|
|
case edit::Commit::Act_InsertFromRange:
|
|
commitInsertFromRange(edit.OrigLoc, edit.Offset,
|
|
edit.InsertFromRangeOffs, edit.Length,
|
|
edit.BeforePrev);
|
|
break;
|
|
case edit::Commit::Act_Remove:
|
|
commitRemove(edit.OrigLoc, edit.Offset, edit.Length);
|
|
break;
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
// Returns true if it is ok to make the two given characters adjacent.
|
|
static bool canBeJoined(char left, char right, const LangOptions &LangOpts) {
|
|
// FIXME: Should use TokenConcatenation to make sure we don't allow stuff like
|
|
// making two '<' adjacent.
|
|
return !(Lexer::isIdentifierBodyChar(left, LangOpts) &&
|
|
Lexer::isIdentifierBodyChar(right, LangOpts));
|
|
}
|
|
|
|
/// Returns true if it is ok to eliminate the trailing whitespace between
|
|
/// the given characters.
|
|
static bool canRemoveWhitespace(char left, char beforeWSpace, char right,
|
|
const LangOptions &LangOpts) {
|
|
if (!canBeJoined(left, right, LangOpts))
|
|
return false;
|
|
if (isWhitespace(left) || isWhitespace(right))
|
|
return true;
|
|
if (canBeJoined(beforeWSpace, right, LangOpts))
|
|
return false; // the whitespace was intentional, keep it.
|
|
return true;
|
|
}
|
|
|
|
/// Check the range that we are going to remove and:
|
|
/// -Remove any trailing whitespace if possible.
|
|
/// -Insert a space if removing the range is going to mess up the source tokens.
|
|
static void adjustRemoval(const SourceManager &SM, const LangOptions &LangOpts,
|
|
SourceLocation Loc, FileOffset offs,
|
|
unsigned &len, StringRef &text) {
|
|
assert(len && text.empty());
|
|
SourceLocation BeginTokLoc = Lexer::GetBeginningOfToken(Loc, SM, LangOpts);
|
|
if (BeginTokLoc != Loc)
|
|
return; // the range is not at the beginning of a token, keep the range.
|
|
|
|
bool Invalid = false;
|
|
StringRef buffer = SM.getBufferData(offs.getFID(), &Invalid);
|
|
if (Invalid)
|
|
return;
|
|
|
|
unsigned begin = offs.getOffset();
|
|
unsigned end = begin + len;
|
|
|
|
// Do not try to extend the removal if we're at the end of the buffer already.
|
|
if (end == buffer.size())
|
|
return;
|
|
|
|
assert(begin < buffer.size() && end < buffer.size() && "Invalid range!");
|
|
|
|
// FIXME: Remove newline.
|
|
|
|
if (begin == 0) {
|
|
if (buffer[end] == ' ')
|
|
++len;
|
|
return;
|
|
}
|
|
|
|
if (buffer[end] == ' ') {
|
|
assert((end + 1 != buffer.size() || buffer.data()[end + 1] == 0) &&
|
|
"buffer not zero-terminated!");
|
|
if (canRemoveWhitespace(/*left=*/buffer[begin-1],
|
|
/*beforeWSpace=*/buffer[end-1],
|
|
/*right=*/buffer.data()[end + 1], // zero-terminated
|
|
LangOpts))
|
|
++len;
|
|
return;
|
|
}
|
|
|
|
if (!canBeJoined(buffer[begin-1], buffer[end], LangOpts))
|
|
text = " ";
|
|
}
|
|
|
|
static void applyRewrite(EditsReceiver &receiver,
|
|
StringRef text, FileOffset offs, unsigned len,
|
|
const SourceManager &SM, const LangOptions &LangOpts,
|
|
bool shouldAdjustRemovals) {
|
|
assert(offs.getFID().isValid());
|
|
SourceLocation Loc = SM.getLocForStartOfFile(offs.getFID());
|
|
Loc = Loc.getLocWithOffset(offs.getOffset());
|
|
assert(Loc.isFileID());
|
|
|
|
if (text.empty() && shouldAdjustRemovals)
|
|
adjustRemoval(SM, LangOpts, Loc, offs, len, text);
|
|
|
|
CharSourceRange range = CharSourceRange::getCharRange(Loc,
|
|
Loc.getLocWithOffset(len));
|
|
|
|
if (text.empty()) {
|
|
assert(len);
|
|
receiver.remove(range);
|
|
return;
|
|
}
|
|
|
|
if (len)
|
|
receiver.replace(range, text);
|
|
else
|
|
receiver.insert(Loc, text);
|
|
}
|
|
|
|
void EditedSource::applyRewrites(EditsReceiver &receiver,
|
|
bool shouldAdjustRemovals) {
|
|
SmallString<128> StrVec;
|
|
FileOffset CurOffs, CurEnd;
|
|
unsigned CurLen;
|
|
|
|
if (FileEdits.empty())
|
|
return;
|
|
|
|
FileEditsTy::iterator I = FileEdits.begin();
|
|
CurOffs = I->first;
|
|
StrVec = I->second.Text;
|
|
CurLen = I->second.RemoveLen;
|
|
CurEnd = CurOffs.getWithOffset(CurLen);
|
|
++I;
|
|
|
|
for (FileEditsTy::iterator E = FileEdits.end(); I != E; ++I) {
|
|
FileOffset offs = I->first;
|
|
FileEdit act = I->second;
|
|
assert(offs >= CurEnd);
|
|
|
|
if (offs == CurEnd) {
|
|
StrVec += act.Text;
|
|
CurLen += act.RemoveLen;
|
|
CurEnd.getWithOffset(act.RemoveLen);
|
|
continue;
|
|
}
|
|
|
|
applyRewrite(receiver, StrVec, CurOffs, CurLen, SourceMgr, LangOpts,
|
|
shouldAdjustRemovals);
|
|
CurOffs = offs;
|
|
StrVec = act.Text;
|
|
CurLen = act.RemoveLen;
|
|
CurEnd = CurOffs.getWithOffset(CurLen);
|
|
}
|
|
|
|
applyRewrite(receiver, StrVec, CurOffs, CurLen, SourceMgr, LangOpts,
|
|
shouldAdjustRemovals);
|
|
}
|
|
|
|
void EditedSource::clearRewrites() {
|
|
FileEdits.clear();
|
|
StrAlloc.Reset();
|
|
}
|
|
|
|
StringRef EditedSource::getSourceText(FileOffset BeginOffs, FileOffset EndOffs,
|
|
bool &Invalid) {
|
|
assert(BeginOffs.getFID() == EndOffs.getFID());
|
|
assert(BeginOffs <= EndOffs);
|
|
SourceLocation BLoc = SourceMgr.getLocForStartOfFile(BeginOffs.getFID());
|
|
BLoc = BLoc.getLocWithOffset(BeginOffs.getOffset());
|
|
assert(BLoc.isFileID());
|
|
SourceLocation
|
|
ELoc = BLoc.getLocWithOffset(EndOffs.getOffset() - BeginOffs.getOffset());
|
|
return Lexer::getSourceText(CharSourceRange::getCharRange(BLoc, ELoc),
|
|
SourceMgr, LangOpts, &Invalid);
|
|
}
|
|
|
|
EditedSource::FileEditsTy::iterator
|
|
EditedSource::getActionForOffset(FileOffset Offs) {
|
|
FileEditsTy::iterator I = FileEdits.upper_bound(Offs);
|
|
if (I == FileEdits.begin())
|
|
return FileEdits.end();
|
|
--I;
|
|
FileEdit &FA = I->second;
|
|
FileOffset B = I->first;
|
|
FileOffset E = B.getWithOffset(FA.RemoveLen);
|
|
if (Offs >= B && Offs < E)
|
|
return I;
|
|
|
|
return FileEdits.end();
|
|
}
|