1 //===- SourceMgr.cpp - Manager for Simple Source Buffers & Diagnostics ----===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the SourceMgr class.  This class is used as a simple
10 // substrate for diagnostics, #include handling, and other low level things for
11 // simple parsers.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "llvm/Support/SourceMgr.h"
16 #include "llvm/ADT/ArrayRef.h"
17 #include "llvm/ADT/STLExtras.h"
18 #include "llvm/ADT/SmallVector.h"
19 #include "llvm/ADT/StringRef.h"
20 #include "llvm/ADT/Twine.h"
21 #include "llvm/Support/ErrorOr.h"
22 #include "llvm/Support/Locale.h"
23 #include "llvm/Support/MemoryBuffer.h"
24 #include "llvm/Support/Path.h"
25 #include "llvm/Support/SMLoc.h"
26 #include "llvm/Support/WithColor.h"
27 #include "llvm/Support/raw_ostream.h"
28 #include <algorithm>
29 #include <cassert>
30 #include <cstddef>
31 #include <limits>
32 #include <memory>
33 #include <string>
34 #include <utility>
35 
36 using namespace llvm;
37 
38 static const size_t TabStop = 8;
39 
AddIncludeFile(const std::string & Filename,SMLoc IncludeLoc,std::string & IncludedFile)40 unsigned SourceMgr::AddIncludeFile(const std::string &Filename,
41                                    SMLoc IncludeLoc,
42                                    std::string &IncludedFile) {
43   IncludedFile = Filename;
44   ErrorOr<std::unique_ptr<MemoryBuffer>> NewBufOrErr =
45       MemoryBuffer::getFile(IncludedFile);
46 
47   // If the file didn't exist directly, see if it's in an include path.
48   for (unsigned i = 0, e = IncludeDirectories.size(); i != e && !NewBufOrErr;
49        ++i) {
50     IncludedFile =
51         IncludeDirectories[i] + sys::path::get_separator().data() + Filename;
52     NewBufOrErr = MemoryBuffer::getFile(IncludedFile);
53   }
54 
55   if (!NewBufOrErr)
56     return 0;
57 
58   return AddNewSourceBuffer(std::move(*NewBufOrErr), IncludeLoc);
59 }
60 
FindBufferContainingLoc(SMLoc Loc) const61 unsigned SourceMgr::FindBufferContainingLoc(SMLoc Loc) const {
62   for (unsigned i = 0, e = Buffers.size(); i != e; ++i)
63     if (Loc.getPointer() >= Buffers[i].Buffer->getBufferStart() &&
64         // Use <= here so that a pointer to the null at the end of the buffer
65         // is included as part of the buffer.
66         Loc.getPointer() <= Buffers[i].Buffer->getBufferEnd())
67       return i + 1;
68   return 0;
69 }
70 
71 template <typename T>
GetOrCreateOffsetCache(void * & OffsetCache,MemoryBuffer * Buffer)72 static std::vector<T> &GetOrCreateOffsetCache(void *&OffsetCache,
73                                               MemoryBuffer *Buffer) {
74   if (OffsetCache)
75     return *static_cast<std::vector<T> *>(OffsetCache);
76 
77   // Lazily fill in the offset cache.
78   auto *Offsets = new std::vector<T>();
79   size_t Sz = Buffer->getBufferSize();
80   assert(Sz <= std::numeric_limits<T>::max());
81   StringRef S = Buffer->getBuffer();
82   for (size_t N = 0; N < Sz; ++N) {
83     if (S[N] == '\n')
84       Offsets->push_back(static_cast<T>(N));
85   }
86 
87   OffsetCache = Offsets;
88   return *Offsets;
89 }
90 
91 template <typename T>
getLineNumberSpecialized(const char * Ptr) const92 unsigned SourceMgr::SrcBuffer::getLineNumberSpecialized(const char *Ptr) const {
93   std::vector<T> &Offsets =
94       GetOrCreateOffsetCache<T>(OffsetCache, Buffer.get());
95 
96   const char *BufStart = Buffer->getBufferStart();
97   assert(Ptr >= BufStart && Ptr <= Buffer->getBufferEnd());
98   ptrdiff_t PtrDiff = Ptr - BufStart;
99   assert(PtrDiff >= 0 &&
100          static_cast<size_t>(PtrDiff) <= std::numeric_limits<T>::max());
101   T PtrOffset = static_cast<T>(PtrDiff);
102 
103   // llvm::lower_bound gives the number of EOL before PtrOffset. Add 1 to get
104   // the line number.
105   return llvm::lower_bound(Offsets, PtrOffset) - Offsets.begin() + 1;
106 }
107 
108 /// Look up a given \p Ptr in in the buffer, determining which line it came
109 /// from.
getLineNumber(const char * Ptr) const110 unsigned SourceMgr::SrcBuffer::getLineNumber(const char *Ptr) const {
111   size_t Sz = Buffer->getBufferSize();
112   if (Sz <= std::numeric_limits<uint8_t>::max())
113     return getLineNumberSpecialized<uint8_t>(Ptr);
114   else if (Sz <= std::numeric_limits<uint16_t>::max())
115     return getLineNumberSpecialized<uint16_t>(Ptr);
116   else if (Sz <= std::numeric_limits<uint32_t>::max())
117     return getLineNumberSpecialized<uint32_t>(Ptr);
118   else
119     return getLineNumberSpecialized<uint64_t>(Ptr);
120 }
121 
122 template <typename T>
getPointerForLineNumberSpecialized(unsigned LineNo) const123 const char *SourceMgr::SrcBuffer::getPointerForLineNumberSpecialized(
124     unsigned LineNo) const {
125   std::vector<T> &Offsets =
126       GetOrCreateOffsetCache<T>(OffsetCache, Buffer.get());
127 
128   // We start counting line and column numbers from 1.
129   if (LineNo != 0)
130     --LineNo;
131 
132   const char *BufStart = Buffer->getBufferStart();
133 
134   // The offset cache contains the location of the \n for the specified line,
135   // we want the start of the line.  As such, we look for the previous entry.
136   if (LineNo == 0)
137     return BufStart;
138   if (LineNo > Offsets.size())
139     return nullptr;
140   return BufStart + Offsets[LineNo - 1] + 1;
141 }
142 
143 /// Return a pointer to the first character of the specified line number or
144 /// null if the line number is invalid.
145 const char *
getPointerForLineNumber(unsigned LineNo) const146 SourceMgr::SrcBuffer::getPointerForLineNumber(unsigned LineNo) const {
147   size_t Sz = Buffer->getBufferSize();
148   if (Sz <= std::numeric_limits<uint8_t>::max())
149     return getPointerForLineNumberSpecialized<uint8_t>(LineNo);
150   else if (Sz <= std::numeric_limits<uint16_t>::max())
151     return getPointerForLineNumberSpecialized<uint16_t>(LineNo);
152   else if (Sz <= std::numeric_limits<uint32_t>::max())
153     return getPointerForLineNumberSpecialized<uint32_t>(LineNo);
154   else
155     return getPointerForLineNumberSpecialized<uint64_t>(LineNo);
156 }
157 
SrcBuffer(SourceMgr::SrcBuffer && Other)158 SourceMgr::SrcBuffer::SrcBuffer(SourceMgr::SrcBuffer &&Other)
159     : Buffer(std::move(Other.Buffer)), OffsetCache(Other.OffsetCache),
160       IncludeLoc(Other.IncludeLoc) {
161   Other.OffsetCache = nullptr;
162 }
163 
~SrcBuffer()164 SourceMgr::SrcBuffer::~SrcBuffer() {
165   if (OffsetCache) {
166     size_t Sz = Buffer->getBufferSize();
167     if (Sz <= std::numeric_limits<uint8_t>::max())
168       delete static_cast<std::vector<uint8_t> *>(OffsetCache);
169     else if (Sz <= std::numeric_limits<uint16_t>::max())
170       delete static_cast<std::vector<uint16_t> *>(OffsetCache);
171     else if (Sz <= std::numeric_limits<uint32_t>::max())
172       delete static_cast<std::vector<uint32_t> *>(OffsetCache);
173     else
174       delete static_cast<std::vector<uint64_t> *>(OffsetCache);
175     OffsetCache = nullptr;
176   }
177 }
178 
179 std::pair<unsigned, unsigned>
getLineAndColumn(SMLoc Loc,unsigned BufferID) const180 SourceMgr::getLineAndColumn(SMLoc Loc, unsigned BufferID) const {
181   if (!BufferID)
182     BufferID = FindBufferContainingLoc(Loc);
183   assert(BufferID && "Invalid location!");
184 
185   auto &SB = getBufferInfo(BufferID);
186   const char *Ptr = Loc.getPointer();
187 
188   unsigned LineNo = SB.getLineNumber(Ptr);
189   const char *BufStart = SB.Buffer->getBufferStart();
190   size_t NewlineOffs = StringRef(BufStart, Ptr - BufStart).find_last_of("\n\r");
191   if (NewlineOffs == StringRef::npos)
192     NewlineOffs = ~(size_t)0;
193   return std::make_pair(LineNo, Ptr - BufStart - NewlineOffs);
194 }
195 
196 // FIXME: Note that the formatting of source locations is spread between
197 // multiple functions, some in SourceMgr and some in SMDiagnostic. A better
198 // solution would be a general-purpose source location formatter
199 // in one of those two classes, or possibly in SMLoc.
200 
201 /// Get a string with the source location formatted in the standard
202 /// style, but without the line offset. If \p IncludePath is true, the path
203 /// is included. If false, only the file name and extension are included.
getFormattedLocationNoOffset(SMLoc Loc,bool IncludePath) const204 std::string SourceMgr::getFormattedLocationNoOffset(SMLoc Loc,
205                                                     bool IncludePath) const {
206   auto BufferID = FindBufferContainingLoc(Loc);
207   assert(BufferID && "Invalid location!");
208   auto FileSpec = getBufferInfo(BufferID).Buffer->getBufferIdentifier();
209 
210   if (IncludePath) {
211     return FileSpec.str() + ":" + std::to_string(FindLineNumber(Loc, BufferID));
212   } else {
213     auto I = FileSpec.find_last_of("/\\");
214     I = (I == FileSpec.size()) ? 0 : (I + 1);
215     return FileSpec.substr(I).str() + ":" +
216            std::to_string(FindLineNumber(Loc, BufferID));
217   }
218 }
219 
220 /// Given a line and column number in a mapped buffer, turn it into an SMLoc.
221 /// This will return a null SMLoc if the line/column location is invalid.
FindLocForLineAndColumn(unsigned BufferID,unsigned LineNo,unsigned ColNo)222 SMLoc SourceMgr::FindLocForLineAndColumn(unsigned BufferID, unsigned LineNo,
223                                          unsigned ColNo) {
224   auto &SB = getBufferInfo(BufferID);
225   const char *Ptr = SB.getPointerForLineNumber(LineNo);
226   if (!Ptr)
227     return SMLoc();
228 
229   // We start counting line and column numbers from 1.
230   if (ColNo != 0)
231     --ColNo;
232 
233   // If we have a column number, validate it.
234   if (ColNo) {
235     // Make sure the location is within the current line.
236     if (Ptr + ColNo > SB.Buffer->getBufferEnd())
237       return SMLoc();
238 
239     // Make sure there is no newline in the way.
240     if (StringRef(Ptr, ColNo).find_first_of("\n\r") != StringRef::npos)
241       return SMLoc();
242 
243     Ptr += ColNo;
244   }
245 
246   return SMLoc::getFromPointer(Ptr);
247 }
248 
PrintIncludeStack(SMLoc IncludeLoc,raw_ostream & OS) const249 void SourceMgr::PrintIncludeStack(SMLoc IncludeLoc, raw_ostream &OS) const {
250   if (IncludeLoc == SMLoc())
251     return; // Top of stack.
252 
253   unsigned CurBuf = FindBufferContainingLoc(IncludeLoc);
254   assert(CurBuf && "Invalid or unspecified location!");
255 
256   PrintIncludeStack(getBufferInfo(CurBuf).IncludeLoc, OS);
257 
258   OS << "Included from " << getBufferInfo(CurBuf).Buffer->getBufferIdentifier()
259      << ":" << FindLineNumber(IncludeLoc, CurBuf) << ":\n";
260 }
261 
GetMessage(SMLoc Loc,SourceMgr::DiagKind Kind,const Twine & Msg,ArrayRef<SMRange> Ranges,ArrayRef<SMFixIt> FixIts) const262 SMDiagnostic SourceMgr::GetMessage(SMLoc Loc, SourceMgr::DiagKind Kind,
263                                    const Twine &Msg, ArrayRef<SMRange> Ranges,
264                                    ArrayRef<SMFixIt> FixIts) const {
265   // First thing to do: find the current buffer containing the specified
266   // location to pull out the source line.
267   SmallVector<std::pair<unsigned, unsigned>, 4> ColRanges;
268   std::pair<unsigned, unsigned> LineAndCol;
269   StringRef BufferID = "<unknown>";
270   std::string LineStr;
271 
272   if (Loc.isValid()) {
273     unsigned CurBuf = FindBufferContainingLoc(Loc);
274     assert(CurBuf && "Invalid or unspecified location!");
275 
276     const MemoryBuffer *CurMB = getMemoryBuffer(CurBuf);
277     BufferID = CurMB->getBufferIdentifier();
278 
279     // Scan backward to find the start of the line.
280     const char *LineStart = Loc.getPointer();
281     const char *BufStart = CurMB->getBufferStart();
282     while (LineStart != BufStart && LineStart[-1] != '\n' &&
283            LineStart[-1] != '\r')
284       --LineStart;
285 
286     // Get the end of the line.
287     const char *LineEnd = Loc.getPointer();
288     const char *BufEnd = CurMB->getBufferEnd();
289     while (LineEnd != BufEnd && LineEnd[0] != '\n' && LineEnd[0] != '\r')
290       ++LineEnd;
291     LineStr = std::string(LineStart, LineEnd);
292 
293     // Convert any ranges to column ranges that only intersect the line of the
294     // location.
295     for (unsigned i = 0, e = Ranges.size(); i != e; ++i) {
296       SMRange R = Ranges[i];
297       if (!R.isValid())
298         continue;
299 
300       // If the line doesn't contain any part of the range, then ignore it.
301       if (R.Start.getPointer() > LineEnd || R.End.getPointer() < LineStart)
302         continue;
303 
304       // Ignore pieces of the range that go onto other lines.
305       if (R.Start.getPointer() < LineStart)
306         R.Start = SMLoc::getFromPointer(LineStart);
307       if (R.End.getPointer() > LineEnd)
308         R.End = SMLoc::getFromPointer(LineEnd);
309 
310       // Translate from SMLoc ranges to column ranges.
311       // FIXME: Handle multibyte characters.
312       ColRanges.push_back(std::make_pair(R.Start.getPointer() - LineStart,
313                                          R.End.getPointer() - LineStart));
314     }
315 
316     LineAndCol = getLineAndColumn(Loc, CurBuf);
317   }
318 
319   return SMDiagnostic(*this, Loc, BufferID, LineAndCol.first,
320                       LineAndCol.second - 1, Kind, Msg.str(), LineStr,
321                       ColRanges, FixIts);
322 }
323 
PrintMessage(raw_ostream & OS,const SMDiagnostic & Diagnostic,bool ShowColors) const324 void SourceMgr::PrintMessage(raw_ostream &OS, const SMDiagnostic &Diagnostic,
325                              bool ShowColors) const {
326   // Report the message with the diagnostic handler if present.
327   if (DiagHandler) {
328     DiagHandler(Diagnostic, DiagContext);
329     return;
330   }
331 
332   if (Diagnostic.getLoc().isValid()) {
333     unsigned CurBuf = FindBufferContainingLoc(Diagnostic.getLoc());
334     assert(CurBuf && "Invalid or unspecified location!");
335     PrintIncludeStack(getBufferInfo(CurBuf).IncludeLoc, OS);
336   }
337 
338   Diagnostic.print(nullptr, OS, ShowColors);
339 }
340 
PrintMessage(raw_ostream & OS,SMLoc Loc,SourceMgr::DiagKind Kind,const Twine & Msg,ArrayRef<SMRange> Ranges,ArrayRef<SMFixIt> FixIts,bool ShowColors) const341 void SourceMgr::PrintMessage(raw_ostream &OS, SMLoc Loc,
342                              SourceMgr::DiagKind Kind, const Twine &Msg,
343                              ArrayRef<SMRange> Ranges, ArrayRef<SMFixIt> FixIts,
344                              bool ShowColors) const {
345   PrintMessage(OS, GetMessage(Loc, Kind, Msg, Ranges, FixIts), ShowColors);
346 }
347 
PrintMessage(SMLoc Loc,SourceMgr::DiagKind Kind,const Twine & Msg,ArrayRef<SMRange> Ranges,ArrayRef<SMFixIt> FixIts,bool ShowColors) const348 void SourceMgr::PrintMessage(SMLoc Loc, SourceMgr::DiagKind Kind,
349                              const Twine &Msg, ArrayRef<SMRange> Ranges,
350                              ArrayRef<SMFixIt> FixIts, bool ShowColors) const {
351   PrintMessage(errs(), Loc, Kind, Msg, Ranges, FixIts, ShowColors);
352 }
353 
354 //===----------------------------------------------------------------------===//
355 // SMFixIt Implementation
356 //===----------------------------------------------------------------------===//
357 
SMFixIt(SMRange R,const Twine & Replacement)358 SMFixIt::SMFixIt(SMRange R, const Twine &Replacement)
359     : Range(R), Text(Replacement.str()) {
360   assert(R.isValid());
361 }
362 
363 //===----------------------------------------------------------------------===//
364 // SMDiagnostic Implementation
365 //===----------------------------------------------------------------------===//
366 
SMDiagnostic(const SourceMgr & sm,SMLoc L,StringRef FN,int Line,int Col,SourceMgr::DiagKind Kind,StringRef Msg,StringRef LineStr,ArrayRef<std::pair<unsigned,unsigned>> Ranges,ArrayRef<SMFixIt> Hints)367 SMDiagnostic::SMDiagnostic(const SourceMgr &sm, SMLoc L, StringRef FN, int Line,
368                            int Col, SourceMgr::DiagKind Kind, StringRef Msg,
369                            StringRef LineStr,
370                            ArrayRef<std::pair<unsigned, unsigned>> Ranges,
371                            ArrayRef<SMFixIt> Hints)
372     : SM(&sm), Loc(L), Filename(std::string(FN)), LineNo(Line), ColumnNo(Col),
373       Kind(Kind), Message(std::string(Msg)), LineContents(std::string(LineStr)),
374       Ranges(Ranges.vec()), FixIts(Hints.begin(), Hints.end()) {
375   llvm::sort(FixIts);
376 }
377 
buildFixItLine(std::string & CaretLine,std::string & FixItLine,ArrayRef<SMFixIt> FixIts,ArrayRef<char> SourceLine)378 static void buildFixItLine(std::string &CaretLine, std::string &FixItLine,
379                            ArrayRef<SMFixIt> FixIts,
380                            ArrayRef<char> SourceLine) {
381   if (FixIts.empty())
382     return;
383 
384   const char *LineStart = SourceLine.begin();
385   const char *LineEnd = SourceLine.end();
386 
387   size_t PrevHintEndCol = 0;
388 
389   for (ArrayRef<SMFixIt>::iterator I = FixIts.begin(), E = FixIts.end(); I != E;
390        ++I) {
391     // If the fixit contains a newline or tab, ignore it.
392     if (I->getText().find_first_of("\n\r\t") != StringRef::npos)
393       continue;
394 
395     SMRange R = I->getRange();
396 
397     // If the line doesn't contain any part of the range, then ignore it.
398     if (R.Start.getPointer() > LineEnd || R.End.getPointer() < LineStart)
399       continue;
400 
401     // Translate from SMLoc to column.
402     // Ignore pieces of the range that go onto other lines.
403     // FIXME: Handle multibyte characters in the source line.
404     unsigned FirstCol;
405     if (R.Start.getPointer() < LineStart)
406       FirstCol = 0;
407     else
408       FirstCol = R.Start.getPointer() - LineStart;
409 
410     // If we inserted a long previous hint, push this one forwards, and add
411     // an extra space to show that this is not part of the previous
412     // completion. This is sort of the best we can do when two hints appear
413     // to overlap.
414     //
415     // Note that if this hint is located immediately after the previous
416     // hint, no space will be added, since the location is more important.
417     unsigned HintCol = FirstCol;
418     if (HintCol < PrevHintEndCol)
419       HintCol = PrevHintEndCol + 1;
420 
421     // FIXME: This assertion is intended to catch unintended use of multibyte
422     // characters in fixits. If we decide to do this, we'll have to track
423     // separate byte widths for the source and fixit lines.
424     assert((size_t)sys::locale::columnWidth(I->getText()) ==
425            I->getText().size());
426 
427     // This relies on one byte per column in our fixit hints.
428     unsigned LastColumnModified = HintCol + I->getText().size();
429     if (LastColumnModified > FixItLine.size())
430       FixItLine.resize(LastColumnModified, ' ');
431 
432     std::copy(I->getText().begin(), I->getText().end(),
433               FixItLine.begin() + HintCol);
434 
435     PrevHintEndCol = LastColumnModified;
436 
437     // For replacements, mark the removal range with '~'.
438     // FIXME: Handle multibyte characters in the source line.
439     unsigned LastCol;
440     if (R.End.getPointer() >= LineEnd)
441       LastCol = LineEnd - LineStart;
442     else
443       LastCol = R.End.getPointer() - LineStart;
444 
445     std::fill(&CaretLine[FirstCol], &CaretLine[LastCol], '~');
446   }
447 }
448 
printSourceLine(raw_ostream & S,StringRef LineContents)449 static void printSourceLine(raw_ostream &S, StringRef LineContents) {
450   // Print out the source line one character at a time, so we can expand tabs.
451   for (unsigned i = 0, e = LineContents.size(), OutCol = 0; i != e; ++i) {
452     size_t NextTab = LineContents.find('\t', i);
453     // If there were no tabs left, print the rest, we are done.
454     if (NextTab == StringRef::npos) {
455       S << LineContents.drop_front(i);
456       break;
457     }
458 
459     // Otherwise, print from i to NextTab.
460     S << LineContents.slice(i, NextTab);
461     OutCol += NextTab - i;
462     i = NextTab;
463 
464     // If we have a tab, emit at least one space, then round up to 8 columns.
465     do {
466       S << ' ';
467       ++OutCol;
468     } while ((OutCol % TabStop) != 0);
469   }
470   S << '\n';
471 }
472 
/// Return true if the high bit of \p c is set, i.e. the byte is outside the
/// 7-bit ASCII range.
static bool isNonASCII(char c) {
  return (static_cast<unsigned char>(c) & 0x80u) != 0;
}
474 
print(const char * ProgName,raw_ostream & OS,bool ShowColors,bool ShowKindLabel) const475 void SMDiagnostic::print(const char *ProgName, raw_ostream &OS, bool ShowColors,
476                          bool ShowKindLabel) const {
477   ColorMode Mode = ShowColors ? ColorMode::Auto : ColorMode::Disable;
478 
479   {
480     WithColor S(OS, raw_ostream::SAVEDCOLOR, true, false, Mode);
481 
482     if (ProgName && ProgName[0])
483       S << ProgName << ": ";
484 
485     if (!Filename.empty()) {
486       if (Filename == "-")
487         S << "<stdin>";
488       else
489         S << Filename;
490 
491       if (LineNo != -1) {
492         S << ':' << LineNo;
493         if (ColumnNo != -1)
494           S << ':' << (ColumnNo + 1);
495       }
496       S << ": ";
497     }
498   }
499 
500   if (ShowKindLabel) {
501     switch (Kind) {
502     case SourceMgr::DK_Error:
503       WithColor::error(OS, "", !ShowColors);
504       break;
505     case SourceMgr::DK_Warning:
506       WithColor::warning(OS, "", !ShowColors);
507       break;
508     case SourceMgr::DK_Note:
509       WithColor::note(OS, "", !ShowColors);
510       break;
511     case SourceMgr::DK_Remark:
512       WithColor::remark(OS, "", !ShowColors);
513       break;
514     }
515   }
516 
517   WithColor(OS, raw_ostream::SAVEDCOLOR, true, false, Mode) << Message << '\n';
518 
519   if (LineNo == -1 || ColumnNo == -1)
520     return;
521 
522   // FIXME: If there are multibyte or multi-column characters in the source, all
523   // our ranges will be wrong. To do this properly, we'll need a byte-to-column
524   // map like Clang's TextDiagnostic. For now, we'll just handle tabs by
525   // expanding them later, and bail out rather than show incorrect ranges and
526   // misaligned fixits for any other odd characters.
527   if (find_if(LineContents, isNonASCII) != LineContents.end()) {
528     printSourceLine(OS, LineContents);
529     return;
530   }
531   size_t NumColumns = LineContents.size();
532 
533   // Build the line with the caret and ranges.
534   std::string CaretLine(NumColumns + 1, ' ');
535 
536   // Expand any ranges.
537   for (unsigned r = 0, e = Ranges.size(); r != e; ++r) {
538     std::pair<unsigned, unsigned> R = Ranges[r];
539     std::fill(&CaretLine[R.first],
540               &CaretLine[std::min((size_t)R.second, CaretLine.size())], '~');
541   }
542 
543   // Add any fix-its.
544   // FIXME: Find the beginning of the line properly for multibyte characters.
545   std::string FixItInsertionLine;
546   buildFixItLine(
547       CaretLine, FixItInsertionLine, FixIts,
548       makeArrayRef(Loc.getPointer() - ColumnNo, LineContents.size()));
549 
550   // Finally, plop on the caret.
551   if (unsigned(ColumnNo) <= NumColumns)
552     CaretLine[ColumnNo] = '^';
553   else
554     CaretLine[NumColumns] = '^';
555 
556   // ... and remove trailing whitespace so the output doesn't wrap for it.  We
557   // know that the line isn't completely empty because it has the caret in it at
558   // least.
559   CaretLine.erase(CaretLine.find_last_not_of(' ') + 1);
560 
561   printSourceLine(OS, LineContents);
562 
563   {
564     ColorMode Mode = ShowColors ? ColorMode::Auto : ColorMode::Disable;
565     WithColor S(OS, raw_ostream::GREEN, true, false, Mode);
566 
567     // Print out the caret line, matching tabs in the source line.
568     for (unsigned i = 0, e = CaretLine.size(), OutCol = 0; i != e; ++i) {
569       if (i >= LineContents.size() || LineContents[i] != '\t') {
570         S << CaretLine[i];
571         ++OutCol;
572         continue;
573       }
574 
575       // Okay, we have a tab.  Insert the appropriate number of characters.
576       do {
577         S << CaretLine[i];
578         ++OutCol;
579       } while ((OutCol % TabStop) != 0);
580     }
581     S << '\n';
582   }
583 
584   // Print out the replacement line, matching tabs in the source line.
585   if (FixItInsertionLine.empty())
586     return;
587 
588   for (size_t i = 0, e = FixItInsertionLine.size(), OutCol = 0; i < e; ++i) {
589     if (i >= LineContents.size() || LineContents[i] != '\t') {
590       OS << FixItInsertionLine[i];
591       ++OutCol;
592       continue;
593     }
594 
595     // Okay, we have a tab.  Insert the appropriate number of characters.
596     do {
597       OS << FixItInsertionLine[i];
598       // FIXME: This is trying not to break up replacements, but then to re-sync
599       // with the tabs between replacements. This will fail, though, if two
600       // fix-it replacements are exactly adjacent, or if a fix-it contains a
601       // space. Really we should be precomputing column widths, which we'll
602       // need anyway for multibyte chars.
603       if (FixItInsertionLine[i] != ' ')
604         ++i;
605       ++OutCol;
606     } while (((OutCol % TabStop) != 0) && i != e);
607   }
608   OS << '\n';
609 }
610