10e7edcfeSLei Zhang //===- ToolUtilities.cpp - MLIR Tool Utilities ----------------------------===//
20e7edcfeSLei Zhang //
330857107SMehdi Amini // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
456222a06SMehdi Amini // See https://llvm.org/LICENSE.txt for license information.
556222a06SMehdi Amini // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60e7edcfeSLei Zhang //
756222a06SMehdi Amini //===----------------------------------------------------------------------===//
80e7edcfeSLei Zhang //
90e7edcfeSLei Zhang // This file defines common utilities for implementing MLIR tools.
100e7edcfeSLei Zhang //
110e7edcfeSLei Zhang //===----------------------------------------------------------------------===//
120e7edcfeSLei Zhang
130e7edcfeSLei Zhang #include "mlir/Support/ToolUtilities.h"
140e7edcfeSLei Zhang #include "mlir/Support/LLVM.h"
150e7edcfeSLei Zhang #include "llvm/Support/SourceMgr.h"
16efb7727aSJacques Pienaar #include "llvm/Support/raw_ostream.h"
170e7edcfeSLei Zhang
180e7edcfeSLei Zhang using namespace mlir;
190e7edcfeSLei Zhang
200e7edcfeSLei Zhang LogicalResult
splitAndProcessBuffer(std::unique_ptr<llvm::MemoryBuffer> originalBuffer,ChunkBufferHandler processChunkBuffer,raw_ostream & os,llvm::StringRef inputSplitMarker,llvm::StringRef outputSplitMarker)210e7edcfeSLei Zhang mlir::splitAndProcessBuffer(std::unique_ptr<llvm::MemoryBuffer> originalBuffer,
220e7edcfeSLei Zhang ChunkBufferHandler processChunkBuffer,
23*516ccce7SIngo Müller raw_ostream &os, llvm::StringRef inputSplitMarker,
24*516ccce7SIngo Müller llvm::StringRef outputSplitMarker) {
259560f021SRiver Riddle // If splitting is disabled, we process the full input buffer.
26*516ccce7SIngo Müller if (inputSplitMarker.empty())
279560f021SRiver Riddle return processChunkBuffer(std::move(originalBuffer), os);
289560f021SRiver Riddle
29*516ccce7SIngo Müller const int inputSplitMarkerLen = inputSplitMarker.size();
300e7edcfeSLei Zhang
310e7edcfeSLei Zhang auto *origMemBuffer = originalBuffer.get();
32efb7727aSJacques Pienaar SmallVector<StringRef, 8> rawSourceBuffers;
33efb7727aSJacques Pienaar const int checkLen = 2;
34efb7727aSJacques Pienaar // Split dropping the last checkLen chars to enable flagging near misses.
35efb7727aSJacques Pienaar origMemBuffer->getBuffer().split(rawSourceBuffers,
36*516ccce7SIngo Müller inputSplitMarker.drop_back(checkLen));
37efb7727aSJacques Pienaar if (rawSourceBuffers.empty())
38efb7727aSJacques Pienaar return success();
390e7edcfeSLei Zhang
400e7edcfeSLei Zhang // Add the original buffer to the source manager.
410e7edcfeSLei Zhang llvm::SourceMgr fileSourceMgr;
426842ec42SRiver Riddle fileSourceMgr.AddNewSourceBuffer(std::move(originalBuffer), SMLoc());
430e7edcfeSLei Zhang
44efb7727aSJacques Pienaar // Flag near misses by iterating over all the sub-buffers found when splitting
45efb7727aSJacques Pienaar // with the prefix of the splitMarker. Use a sliding window where we only add
46efb7727aSJacques Pienaar // a buffer as a sourceBuffer if terminated by a full match of the
47efb7727aSJacques Pienaar // splitMarker, else flag a warning (if near miss) and extend the size of the
48efb7727aSJacques Pienaar // buffer under consideration.
49efb7727aSJacques Pienaar SmallVector<StringRef, 8> sourceBuffers;
50efb7727aSJacques Pienaar StringRef prev;
51efb7727aSJacques Pienaar for (auto buffer : rawSourceBuffers) {
52efb7727aSJacques Pienaar if (prev.empty()) {
53efb7727aSJacques Pienaar prev = buffer;
54efb7727aSJacques Pienaar continue;
55efb7727aSJacques Pienaar }
56efb7727aSJacques Pienaar
57efb7727aSJacques Pienaar // Check that suffix is as expected and doesn't have any dash post.
58*516ccce7SIngo Müller bool expectedSuffix =
59*516ccce7SIngo Müller buffer.starts_with(inputSplitMarker.take_back(checkLen)) &&
60efb7727aSJacques Pienaar buffer.size() > checkLen && buffer[checkLen] != '0';
61efb7727aSJacques Pienaar if (expectedSuffix) {
62efb7727aSJacques Pienaar sourceBuffers.push_back(prev);
63efb7727aSJacques Pienaar prev = buffer.drop_front(checkLen);
64efb7727aSJacques Pienaar } else {
65efb7727aSJacques Pienaar // TODO: Consider making this a failure.
666842ec42SRiver Riddle auto splitLoc = SMLoc::getFromPointer(buffer.data());
67efb7727aSJacques Pienaar fileSourceMgr.PrintMessage(llvm::errs(), splitLoc,
68efb7727aSJacques Pienaar llvm::SourceMgr::DK_Warning,
69efb7727aSJacques Pienaar "near miss with file split marker");
70*516ccce7SIngo Müller prev = StringRef(prev.data(), prev.size() + inputSplitMarkerLen -
71*516ccce7SIngo Müller checkLen + buffer.size());
72efb7727aSJacques Pienaar }
73efb7727aSJacques Pienaar }
74efb7727aSJacques Pienaar if (!prev.empty())
75efb7727aSJacques Pienaar sourceBuffers.push_back(prev);
76efb7727aSJacques Pienaar
770e7edcfeSLei Zhang // Process each chunk in turn.
780e7edcfeSLei Zhang bool hadFailure = false;
799560f021SRiver Riddle auto interleaveFn = [&](StringRef subBuffer) {
806842ec42SRiver Riddle auto splitLoc = SMLoc::getFromPointer(subBuffer.data());
810e7edcfeSLei Zhang unsigned splitLine = fileSourceMgr.getLineAndColumn(splitLoc).first;
820e7edcfeSLei Zhang auto subMemBuffer = llvm::MemoryBuffer::getMemBufferCopy(
83a6d76cf6SMehdi Amini subBuffer, Twine("within split at ") +
84a6d76cf6SMehdi Amini origMemBuffer->getBufferIdentifier() + ":" +
85a6d76cf6SMehdi Amini Twine(splitLine) + " offset ");
860e7edcfeSLei Zhang if (failed(processChunkBuffer(std::move(subMemBuffer), os)))
870e7edcfeSLei Zhang hadFailure = true;
889560f021SRiver Riddle };
899560f021SRiver Riddle llvm::interleave(sourceBuffers, os, interleaveFn,
90*516ccce7SIngo Müller (llvm::Twine(outputSplitMarker) + "\n").str());
910e7edcfeSLei Zhang
920e7edcfeSLei Zhang // If any fails, then return a failure of the tool.
930e7edcfeSLei Zhang return failure(hadFailure);
940e7edcfeSLei Zhang }
95