CoverageMapping.cpp revision 327952
//===- CoverageMapping.cpp - Code coverage mapping support ----------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file contains support for clang's and llvm's instrumentation based
// code coverage.
//
//===----------------------------------------------------------------------===//
14303231Sdim
15303231Sdim#include "llvm/ProfileData/Coverage/CoverageMapping.h"
16321369Sdim#include "llvm/ADT/ArrayRef.h"
17303231Sdim#include "llvm/ADT/DenseMap.h"
18321369Sdim#include "llvm/ADT/None.h"
19303231Sdim#include "llvm/ADT/Optional.h"
20303231Sdim#include "llvm/ADT/SmallBitVector.h"
21321369Sdim#include "llvm/ADT/SmallVector.h"
22321369Sdim#include "llvm/ADT/StringRef.h"
23303231Sdim#include "llvm/ProfileData/Coverage/CoverageMappingReader.h"
24303231Sdim#include "llvm/ProfileData/InstrProfReader.h"
25303231Sdim#include "llvm/Support/Debug.h"
26303231Sdim#include "llvm/Support/Errc.h"
27321369Sdim#include "llvm/Support/Error.h"
28303231Sdim#include "llvm/Support/ErrorHandling.h"
29303231Sdim#include "llvm/Support/ManagedStatic.h"
30321369Sdim#include "llvm/Support/MemoryBuffer.h"
31303231Sdim#include "llvm/Support/raw_ostream.h"
32321369Sdim#include <algorithm>
33321369Sdim#include <cassert>
34321369Sdim#include <cstdint>
35321369Sdim#include <iterator>
36327952Sdim#include <map>
37321369Sdim#include <memory>
38321369Sdim#include <string>
39321369Sdim#include <system_error>
40321369Sdim#include <utility>
41321369Sdim#include <vector>
42303231Sdim
43303231Sdimusing namespace llvm;
44303231Sdimusing namespace coverage;
45303231Sdim
46303231Sdim#define DEBUG_TYPE "coverage-mapping"
47303231Sdim
48303231SdimCounter CounterExpressionBuilder::get(const CounterExpression &E) {
49303231Sdim  auto It = ExpressionIndices.find(E);
50303231Sdim  if (It != ExpressionIndices.end())
51303231Sdim    return Counter::getExpression(It->second);
52303231Sdim  unsigned I = Expressions.size();
53303231Sdim  Expressions.push_back(E);
54303231Sdim  ExpressionIndices[E] = I;
55303231Sdim  return Counter::getExpression(I);
56303231Sdim}
57303231Sdim
58321369Sdimvoid CounterExpressionBuilder::extractTerms(Counter C, int Factor,
59321369Sdim                                            SmallVectorImpl<Term> &Terms) {
60303231Sdim  switch (C.getKind()) {
61303231Sdim  case Counter::Zero:
62303231Sdim    break;
63303231Sdim  case Counter::CounterValueReference:
64321369Sdim    Terms.emplace_back(C.getCounterID(), Factor);
65303231Sdim    break;
66303231Sdim  case Counter::Expression:
67303231Sdim    const auto &E = Expressions[C.getExpressionID()];
68321369Sdim    extractTerms(E.LHS, Factor, Terms);
69321369Sdim    extractTerms(
70321369Sdim        E.RHS, E.Kind == CounterExpression::Subtract ? -Factor : Factor, Terms);
71303231Sdim    break;
72303231Sdim  }
73303231Sdim}
74303231Sdim
75303231SdimCounter CounterExpressionBuilder::simplify(Counter ExpressionTree) {
76303231Sdim  // Gather constant terms.
77321369Sdim  SmallVector<Term, 32> Terms;
78303231Sdim  extractTerms(ExpressionTree, +1, Terms);
79303231Sdim
80303231Sdim  // If there are no terms, this is just a zero. The algorithm below assumes at
81303231Sdim  // least one term.
82303231Sdim  if (Terms.size() == 0)
83303231Sdim    return Counter::getZero();
84303231Sdim
85303231Sdim  // Group the terms by counter ID.
86321369Sdim  std::sort(Terms.begin(), Terms.end(), [](const Term &LHS, const Term &RHS) {
87321369Sdim    return LHS.CounterID < RHS.CounterID;
88303231Sdim  });
89303231Sdim
90303231Sdim  // Combine terms by counter ID to eliminate counters that sum to zero.
91303231Sdim  auto Prev = Terms.begin();
92303231Sdim  for (auto I = Prev + 1, E = Terms.end(); I != E; ++I) {
93321369Sdim    if (I->CounterID == Prev->CounterID) {
94321369Sdim      Prev->Factor += I->Factor;
95303231Sdim      continue;
96303231Sdim    }
97303231Sdim    ++Prev;
98303231Sdim    *Prev = *I;
99303231Sdim  }
100303231Sdim  Terms.erase(++Prev, Terms.end());
101303231Sdim
102303231Sdim  Counter C;
103303231Sdim  // Create additions. We do this before subtractions to avoid constructs like
104303231Sdim  // ((0 - X) + Y), as opposed to (Y - X).
105321369Sdim  for (auto T : Terms) {
106321369Sdim    if (T.Factor <= 0)
107303231Sdim      continue;
108321369Sdim    for (int I = 0; I < T.Factor; ++I)
109303231Sdim      if (C.isZero())
110321369Sdim        C = Counter::getCounter(T.CounterID);
111303231Sdim      else
112303231Sdim        C = get(CounterExpression(CounterExpression::Add, C,
113321369Sdim                                  Counter::getCounter(T.CounterID)));
114303231Sdim  }
115303231Sdim
116303231Sdim  // Create subtractions.
117321369Sdim  for (auto T : Terms) {
118321369Sdim    if (T.Factor >= 0)
119303231Sdim      continue;
120321369Sdim    for (int I = 0; I < -T.Factor; ++I)
121303231Sdim      C = get(CounterExpression(CounterExpression::Subtract, C,
122321369Sdim                                Counter::getCounter(T.CounterID)));
123303231Sdim  }
124303231Sdim  return C;
125303231Sdim}
126303231Sdim
127303231SdimCounter CounterExpressionBuilder::add(Counter LHS, Counter RHS) {
128303231Sdim  return simplify(get(CounterExpression(CounterExpression::Add, LHS, RHS)));
129303231Sdim}
130303231Sdim
131303231SdimCounter CounterExpressionBuilder::subtract(Counter LHS, Counter RHS) {
132303231Sdim  return simplify(
133303231Sdim      get(CounterExpression(CounterExpression::Subtract, LHS, RHS)));
134303231Sdim}
135303231Sdim
136321369Sdimvoid CounterMappingContext::dump(const Counter &C, raw_ostream &OS) const {
137303231Sdim  switch (C.getKind()) {
138303231Sdim  case Counter::Zero:
139303231Sdim    OS << '0';
140303231Sdim    return;
141303231Sdim  case Counter::CounterValueReference:
142303231Sdim    OS << '#' << C.getCounterID();
143303231Sdim    break;
144303231Sdim  case Counter::Expression: {
145303231Sdim    if (C.getExpressionID() >= Expressions.size())
146303231Sdim      return;
147303231Sdim    const auto &E = Expressions[C.getExpressionID()];
148303231Sdim    OS << '(';
149303231Sdim    dump(E.LHS, OS);
150303231Sdim    OS << (E.Kind == CounterExpression::Subtract ? " - " : " + ");
151303231Sdim    dump(E.RHS, OS);
152303231Sdim    OS << ')';
153303231Sdim    break;
154303231Sdim  }
155303231Sdim  }
156303231Sdim  if (CounterValues.empty())
157303231Sdim    return;
158303231Sdim  Expected<int64_t> Value = evaluate(C);
159303231Sdim  if (auto E = Value.takeError()) {
160321369Sdim    consumeError(std::move(E));
161303231Sdim    return;
162303231Sdim  }
163303231Sdim  OS << '[' << *Value << ']';
164303231Sdim}
165303231Sdim
166303231SdimExpected<int64_t> CounterMappingContext::evaluate(const Counter &C) const {
167303231Sdim  switch (C.getKind()) {
168303231Sdim  case Counter::Zero:
169303231Sdim    return 0;
170303231Sdim  case Counter::CounterValueReference:
171303231Sdim    if (C.getCounterID() >= CounterValues.size())
172303231Sdim      return errorCodeToError(errc::argument_out_of_domain);
173303231Sdim    return CounterValues[C.getCounterID()];
174303231Sdim  case Counter::Expression: {
175303231Sdim    if (C.getExpressionID() >= Expressions.size())
176303231Sdim      return errorCodeToError(errc::argument_out_of_domain);
177303231Sdim    const auto &E = Expressions[C.getExpressionID()];
178303231Sdim    Expected<int64_t> LHS = evaluate(E.LHS);
179303231Sdim    if (!LHS)
180303231Sdim      return LHS;
181303231Sdim    Expected<int64_t> RHS = evaluate(E.RHS);
182303231Sdim    if (!RHS)
183303231Sdim      return RHS;
184303231Sdim    return E.Kind == CounterExpression::Subtract ? *LHS - *RHS : *LHS + *RHS;
185303231Sdim  }
186303231Sdim  }
187303231Sdim  llvm_unreachable("Unhandled CounterKind");
188303231Sdim}
189303231Sdim
190303231Sdimvoid FunctionRecordIterator::skipOtherFiles() {
191303231Sdim  while (Current != Records.end() && !Filename.empty() &&
192303231Sdim         Filename != Current->Filenames[0])
193303231Sdim    ++Current;
194303231Sdim  if (Current == Records.end())
195303231Sdim    *this = FunctionRecordIterator();
196303231Sdim}
197303231Sdim
198314564SdimError CoverageMapping::loadFunctionRecord(
199314564Sdim    const CoverageMappingRecord &Record,
200314564Sdim    IndexedInstrProfReader &ProfileReader) {
201314564Sdim  StringRef OrigFuncName = Record.FunctionName;
202321369Sdim  if (OrigFuncName.empty())
203321369Sdim    return make_error<CoverageMapError>(coveragemap_error::malformed);
204321369Sdim
205314564Sdim  if (Record.Filenames.empty())
206314564Sdim    OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName);
207314564Sdim  else
208314564Sdim    OrigFuncName = getFuncNameWithoutPrefix(OrigFuncName, Record.Filenames[0]);
209314564Sdim
210314564Sdim  // Don't load records for functions we've already seen.
211314564Sdim  if (!FunctionNames.insert(OrigFuncName).second)
212314564Sdim    return Error::success();
213314564Sdim
214314564Sdim  CounterMappingContext Ctx(Record.Expressions);
215314564Sdim
216314564Sdim  std::vector<uint64_t> Counts;
217314564Sdim  if (Error E = ProfileReader.getFunctionCounts(Record.FunctionName,
218314564Sdim                                                Record.FunctionHash, Counts)) {
219314564Sdim    instrprof_error IPE = InstrProfError::take(std::move(E));
220314564Sdim    if (IPE == instrprof_error::hash_mismatch) {
221327952Sdim      FuncHashMismatches.emplace_back(Record.FunctionName, Record.FunctionHash);
222314564Sdim      return Error::success();
223314564Sdim    } else if (IPE != instrprof_error::unknown_function)
224314564Sdim      return make_error<InstrProfError>(IPE);
225314564Sdim    Counts.assign(Record.MappingRegions.size(), 0);
226314564Sdim  }
227314564Sdim  Ctx.setCounts(Counts);
228314564Sdim
229314564Sdim  assert(!Record.MappingRegions.empty() && "Function has no regions");
230314564Sdim
231314564Sdim  FunctionRecord Function(OrigFuncName, Record.Filenames);
232314564Sdim  for (const auto &Region : Record.MappingRegions) {
233314564Sdim    Expected<int64_t> ExecutionCount = Ctx.evaluate(Region.Count);
234314564Sdim    if (auto E = ExecutionCount.takeError()) {
235321369Sdim      consumeError(std::move(E));
236314564Sdim      return Error::success();
237314564Sdim    }
238314564Sdim    Function.pushRegion(Region, *ExecutionCount);
239314564Sdim  }
240314564Sdim  if (Function.CountedRegions.size() != Record.MappingRegions.size()) {
241327952Sdim    FuncCounterMismatches.emplace_back(Record.FunctionName,
242327952Sdim                                       Function.CountedRegions.size());
243314564Sdim    return Error::success();
244314564Sdim  }
245314564Sdim
246314564Sdim  Functions.push_back(std::move(Function));
247314564Sdim  return Error::success();
248314564Sdim}
249314564Sdim
250314564SdimExpected<std::unique_ptr<CoverageMapping>> CoverageMapping::load(
251314564Sdim    ArrayRef<std::unique_ptr<CoverageMappingReader>> CoverageReaders,
252314564Sdim    IndexedInstrProfReader &ProfileReader) {
253314564Sdim  auto Coverage = std::unique_ptr<CoverageMapping>(new CoverageMapping());
254303231Sdim
255327952Sdim  for (const auto &CoverageReader : CoverageReaders) {
256327952Sdim    for (auto RecordOrErr : *CoverageReader) {
257327952Sdim      if (Error E = RecordOrErr.takeError())
258327952Sdim        return std::move(E);
259327952Sdim      const auto &Record = *RecordOrErr;
260314564Sdim      if (Error E = Coverage->loadFunctionRecord(Record, ProfileReader))
261314564Sdim        return std::move(E);
262327952Sdim    }
263327952Sdim  }
264303231Sdim
265303231Sdim  return std::move(Coverage);
266303231Sdim}
267303231Sdim
268303231SdimExpected<std::unique_ptr<CoverageMapping>>
269314564SdimCoverageMapping::load(ArrayRef<StringRef> ObjectFilenames,
270327952Sdim                      StringRef ProfileFilename, ArrayRef<StringRef> Arches) {
271303231Sdim  auto ProfileReaderOrErr = IndexedInstrProfReader::create(ProfileFilename);
272303231Sdim  if (Error E = ProfileReaderOrErr.takeError())
273303231Sdim    return std::move(E);
274303231Sdim  auto ProfileReader = std::move(ProfileReaderOrErr.get());
275314564Sdim
276314564Sdim  SmallVector<std::unique_ptr<CoverageMappingReader>, 4> Readers;
277314564Sdim  SmallVector<std::unique_ptr<MemoryBuffer>, 4> Buffers;
278327952Sdim  for (const auto &File : llvm::enumerate(ObjectFilenames)) {
279327952Sdim    auto CovMappingBufOrErr = MemoryBuffer::getFileOrSTDIN(File.value());
280314564Sdim    if (std::error_code EC = CovMappingBufOrErr.getError())
281314564Sdim      return errorCodeToError(EC);
282327952Sdim    StringRef Arch = Arches.empty() ? StringRef() : Arches[File.index()];
283314564Sdim    auto CoverageReaderOrErr =
284314564Sdim        BinaryCoverageReader::create(CovMappingBufOrErr.get(), Arch);
285314564Sdim    if (Error E = CoverageReaderOrErr.takeError())
286314564Sdim      return std::move(E);
287314564Sdim    Readers.push_back(std::move(CoverageReaderOrErr.get()));
288314564Sdim    Buffers.push_back(std::move(CovMappingBufOrErr.get()));
289314564Sdim  }
290314564Sdim  return load(Readers, *ProfileReader);
291303231Sdim}
292303231Sdim
293303231Sdimnamespace {
294321369Sdim
295303231Sdim/// \brief Distributes functions into instantiation sets.
296303231Sdim///
297303231Sdim/// An instantiation set is a collection of functions that have the same source
298303231Sdim/// code, ie, template functions specializations.
299303231Sdimclass FunctionInstantiationSetCollector {
300327952Sdim  using MapT = std::map<LineColPair, std::vector<const FunctionRecord *>>;
301303231Sdim  MapT InstantiatedFunctions;
302303231Sdim
303303231Sdimpublic:
304303231Sdim  void insert(const FunctionRecord &Function, unsigned FileID) {
305303231Sdim    auto I = Function.CountedRegions.begin(), E = Function.CountedRegions.end();
306303231Sdim    while (I != E && I->FileID != FileID)
307303231Sdim      ++I;
308303231Sdim    assert(I != E && "function does not cover the given file");
309303231Sdim    auto &Functions = InstantiatedFunctions[I->startLoc()];
310303231Sdim    Functions.push_back(&Function);
311303231Sdim  }
312303231Sdim
313303231Sdim  MapT::iterator begin() { return InstantiatedFunctions.begin(); }
314303231Sdim  MapT::iterator end() { return InstantiatedFunctions.end(); }
315303231Sdim};
316303231Sdim
317303231Sdimclass SegmentBuilder {
318303231Sdim  std::vector<CoverageSegment> &Segments;
319303231Sdim  SmallVector<const CountedRegion *, 8> ActiveRegions;
320303231Sdim
321303231Sdim  SegmentBuilder(std::vector<CoverageSegment> &Segments) : Segments(Segments) {}
322303231Sdim
323327952Sdim  /// Emit a segment with the count from \p Region starting at \p StartLoc.
324327952Sdim  //
325327952Sdim  /// \p IsRegionEntry: The segment is at the start of a new non-gap region.
326327952Sdim  /// \p EmitSkippedRegion: The segment must be emitted as a skipped region.
327327952Sdim  void startSegment(const CountedRegion &Region, LineColPair StartLoc,
328327952Sdim                    bool IsRegionEntry, bool EmitSkippedRegion = false) {
329327952Sdim    bool HasCount = !EmitSkippedRegion &&
330327952Sdim                    (Region.Kind != CounterMappingRegion::SkippedRegion);
331303231Sdim
332327952Sdim    // If the new segment wouldn't affect coverage rendering, skip it.
333327952Sdim    if (!Segments.empty() && !IsRegionEntry && !EmitSkippedRegion) {
334327952Sdim      const auto &Last = Segments.back();
335327952Sdim      if (Last.HasCount == HasCount && Last.Count == Region.ExecutionCount &&
336327952Sdim          !Last.IsRegionEntry)
337327952Sdim        return;
338327952Sdim    }
339303231Sdim
340327952Sdim    if (HasCount)
341327952Sdim      Segments.emplace_back(StartLoc.first, StartLoc.second,
342327952Sdim                            Region.ExecutionCount, IsRegionEntry,
343327952Sdim                            Region.Kind == CounterMappingRegion::GapRegion);
344327952Sdim    else
345327952Sdim      Segments.emplace_back(StartLoc.first, StartLoc.second, IsRegionEntry);
346327952Sdim
347327952Sdim    DEBUG({
348327952Sdim      const auto &Last = Segments.back();
349327952Sdim      dbgs() << "Segment at " << Last.Line << ":" << Last.Col
350327952Sdim             << " (count = " << Last.Count << ")"
351327952Sdim             << (Last.IsRegionEntry ? ", RegionEntry" : "")
352327952Sdim             << (!Last.HasCount ? ", Skipped" : "")
353327952Sdim             << (Last.IsGapRegion ? ", Gap" : "") << "\n";
354327952Sdim    });
355303231Sdim  }
356303231Sdim
357327952Sdim  /// Emit segments for active regions which end before \p Loc.
358327952Sdim  ///
359327952Sdim  /// \p Loc: The start location of the next region. If None, all active
360327952Sdim  /// regions are completed.
361327952Sdim  /// \p FirstCompletedRegion: Index of the first completed region.
362327952Sdim  void completeRegionsUntil(Optional<LineColPair> Loc,
363327952Sdim                            unsigned FirstCompletedRegion) {
364327952Sdim    // Sort the completed regions by end location. This makes it simple to
365327952Sdim    // emit closing segments in sorted order.
366327952Sdim    auto CompletedRegionsIt = ActiveRegions.begin() + FirstCompletedRegion;
367327952Sdim    std::stable_sort(CompletedRegionsIt, ActiveRegions.end(),
368327952Sdim                      [](const CountedRegion *L, const CountedRegion *R) {
369327952Sdim                        return L->endLoc() < R->endLoc();
370327952Sdim                      });
371327952Sdim
372327952Sdim    // Emit segments for all completed regions.
373327952Sdim    for (unsigned I = FirstCompletedRegion + 1, E = ActiveRegions.size(); I < E;
374327952Sdim         ++I) {
375327952Sdim      const auto *CompletedRegion = ActiveRegions[I];
376327952Sdim      assert((!Loc || CompletedRegion->endLoc() <= *Loc) &&
377327952Sdim             "Completed region ends after start of new region");
378327952Sdim
379327952Sdim      const auto *PrevCompletedRegion = ActiveRegions[I - 1];
380327952Sdim      auto CompletedSegmentLoc = PrevCompletedRegion->endLoc();
381327952Sdim
382327952Sdim      // Don't emit any more segments if they start where the new region begins.
383327952Sdim      if (Loc && CompletedSegmentLoc == *Loc)
384327952Sdim        break;
385327952Sdim
386327952Sdim      // Don't emit a segment if the next completed region ends at the same
387327952Sdim      // location as this one.
388327952Sdim      if (CompletedSegmentLoc == CompletedRegion->endLoc())
389327952Sdim        continue;
390327952Sdim
391327952Sdim      // Use the count from the last completed region which ends at this loc.
392327952Sdim      for (unsigned J = I + 1; J < E; ++J)
393327952Sdim        if (CompletedRegion->endLoc() == ActiveRegions[J]->endLoc())
394327952Sdim          CompletedRegion = ActiveRegions[J];
395327952Sdim
396327952Sdim      startSegment(*CompletedRegion, CompletedSegmentLoc, false);
397327952Sdim    }
398327952Sdim
399327952Sdim    auto Last = ActiveRegions.back();
400327952Sdim    if (FirstCompletedRegion && Last->endLoc() != *Loc) {
401327952Sdim      // If there's a gap after the end of the last completed region and the
402327952Sdim      // start of the new region, use the last active region to fill the gap.
403327952Sdim      startSegment(*ActiveRegions[FirstCompletedRegion - 1], Last->endLoc(),
404327952Sdim                   false);
405327952Sdim    } else if (!FirstCompletedRegion && (!Loc || *Loc != Last->endLoc())) {
406327952Sdim      // Emit a skipped segment if there are no more active regions. This
407327952Sdim      // ensures that gaps between functions are marked correctly.
408327952Sdim      startSegment(*Last, Last->endLoc(), false, true);
409327952Sdim    }
410327952Sdim
411327952Sdim    // Pop the completed regions.
412327952Sdim    ActiveRegions.erase(CompletedRegionsIt, ActiveRegions.end());
413303231Sdim  }
414303231Sdim
415303231Sdim  void buildSegmentsImpl(ArrayRef<CountedRegion> Regions) {
416327952Sdim    for (const auto &CR : enumerate(Regions)) {
417327952Sdim      auto CurStartLoc = CR.value().startLoc();
418327952Sdim
419327952Sdim      // Active regions which end before the current region need to be popped.
420327952Sdim      auto CompletedRegions =
421327952Sdim          std::stable_partition(ActiveRegions.begin(), ActiveRegions.end(),
422327952Sdim                                [&](const CountedRegion *Region) {
423327952Sdim                                  return !(Region->endLoc() <= CurStartLoc);
424327952Sdim                                });
425327952Sdim      if (CompletedRegions != ActiveRegions.end()) {
426327952Sdim        unsigned FirstCompletedRegion =
427327952Sdim            std::distance(ActiveRegions.begin(), CompletedRegions);
428327952Sdim        completeRegionsUntil(CurStartLoc, FirstCompletedRegion);
429327952Sdim      }
430327952Sdim
431327952Sdim      bool GapRegion = CR.value().Kind == CounterMappingRegion::GapRegion;
432327952Sdim
433327952Sdim      // Try to emit a segment for the current region.
434327952Sdim      if (CurStartLoc == CR.value().endLoc()) {
435327952Sdim        // Avoid making zero-length regions active. If it's the last region,
436327952Sdim        // emit a skipped segment. Otherwise use its predecessor's count.
437327952Sdim        const bool Skipped = (CR.index() + 1) == Regions.size();
438327952Sdim        startSegment(ActiveRegions.empty() ? CR.value() : *ActiveRegions.back(),
439327952Sdim                     CurStartLoc, !GapRegion, Skipped);
440327952Sdim        continue;
441327952Sdim      }
442327952Sdim      if (CR.index() + 1 == Regions.size() ||
443327952Sdim          CurStartLoc != Regions[CR.index() + 1].startLoc()) {
444327952Sdim        // Emit a segment if the next region doesn't start at the same location
445327952Sdim        // as this one.
446327952Sdim        startSegment(CR.value(), CurStartLoc, !GapRegion);
447327952Sdim      }
448327952Sdim
449327952Sdim      // This region is active (i.e not completed).
450327952Sdim      ActiveRegions.push_back(&CR.value());
451303231Sdim    }
452327952Sdim
453327952Sdim    // Complete any remaining active regions.
454327952Sdim    if (!ActiveRegions.empty())
455327952Sdim      completeRegionsUntil(None, 0);
456303231Sdim  }
457303231Sdim
458303231Sdim  /// Sort a nested sequence of regions from a single file.
459303231Sdim  static void sortNestedRegions(MutableArrayRef<CountedRegion> Regions) {
460303231Sdim    std::sort(Regions.begin(), Regions.end(), [](const CountedRegion &LHS,
461303231Sdim                                                 const CountedRegion &RHS) {
462303231Sdim      if (LHS.startLoc() != RHS.startLoc())
463303231Sdim        return LHS.startLoc() < RHS.startLoc();
464303231Sdim      if (LHS.endLoc() != RHS.endLoc())
465303231Sdim        // When LHS completely contains RHS, we sort LHS first.
466303231Sdim        return RHS.endLoc() < LHS.endLoc();
467303231Sdim      // If LHS and RHS cover the same area, we need to sort them according
468303231Sdim      // to their kinds so that the most suitable region will become "active"
469303231Sdim      // in combineRegions(). Because we accumulate counter values only from
470303231Sdim      // regions of the same kind as the first region of the area, prefer
471303231Sdim      // CodeRegion to ExpansionRegion and ExpansionRegion to SkippedRegion.
472321369Sdim      static_assert(CounterMappingRegion::CodeRegion <
473321369Sdim                            CounterMappingRegion::ExpansionRegion &&
474321369Sdim                        CounterMappingRegion::ExpansionRegion <
475321369Sdim                            CounterMappingRegion::SkippedRegion,
476303231Sdim                    "Unexpected order of region kind values");
477303231Sdim      return LHS.Kind < RHS.Kind;
478303231Sdim    });
479303231Sdim  }
480303231Sdim
481303231Sdim  /// Combine counts of regions which cover the same area.
482303231Sdim  static ArrayRef<CountedRegion>
483303231Sdim  combineRegions(MutableArrayRef<CountedRegion> Regions) {
484303231Sdim    if (Regions.empty())
485303231Sdim      return Regions;
486303231Sdim    auto Active = Regions.begin();
487303231Sdim    auto End = Regions.end();
488303231Sdim    for (auto I = Regions.begin() + 1; I != End; ++I) {
489303231Sdim      if (Active->startLoc() != I->startLoc() ||
490303231Sdim          Active->endLoc() != I->endLoc()) {
491303231Sdim        // Shift to the next region.
492303231Sdim        ++Active;
493303231Sdim        if (Active != I)
494303231Sdim          *Active = *I;
495303231Sdim        continue;
496303231Sdim      }
497303231Sdim      // Merge duplicate region.
498303231Sdim      // If CodeRegions and ExpansionRegions cover the same area, it's probably
499303231Sdim      // a macro which is fully expanded to another macro. In that case, we need
500303231Sdim      // to accumulate counts only from CodeRegions, or else the area will be
501303231Sdim      // counted twice.
502303231Sdim      // On the other hand, a macro may have a nested macro in its body. If the
503303231Sdim      // outer macro is used several times, the ExpansionRegion for the nested
504303231Sdim      // macro will also be added several times. These ExpansionRegions cover
505303231Sdim      // the same source locations and have to be combined to reach the correct
506303231Sdim      // value for that area.
507303231Sdim      // We add counts of the regions of the same kind as the active region
508303231Sdim      // to handle the both situations.
509303231Sdim      if (I->Kind == Active->Kind)
510303231Sdim        Active->ExecutionCount += I->ExecutionCount;
511303231Sdim    }
512303231Sdim    return Regions.drop_back(std::distance(++Active, End));
513303231Sdim  }
514303231Sdim
515303231Sdimpublic:
516327952Sdim  /// Build a sorted list of CoverageSegments from a list of Regions.
517303231Sdim  static std::vector<CoverageSegment>
518303231Sdim  buildSegments(MutableArrayRef<CountedRegion> Regions) {
519303231Sdim    std::vector<CoverageSegment> Segments;
520303231Sdim    SegmentBuilder Builder(Segments);
521303231Sdim
522303231Sdim    sortNestedRegions(Regions);
523303231Sdim    ArrayRef<CountedRegion> CombinedRegions = combineRegions(Regions);
524303231Sdim
525327952Sdim    DEBUG({
526327952Sdim      dbgs() << "Combined regions:\n";
527327952Sdim      for (const auto &CR : CombinedRegions)
528327952Sdim        dbgs() << "  " << CR.LineStart << ":" << CR.ColumnStart << " -> "
529327952Sdim               << CR.LineEnd << ":" << CR.ColumnEnd
530327952Sdim               << " (count=" << CR.ExecutionCount << ")\n";
531327952Sdim    });
532327952Sdim
533303231Sdim    Builder.buildSegmentsImpl(CombinedRegions);
534327952Sdim
535327952Sdim#ifndef NDEBUG
536327952Sdim    for (unsigned I = 1, E = Segments.size(); I < E; ++I) {
537327952Sdim      const auto &L = Segments[I - 1];
538327952Sdim      const auto &R = Segments[I];
539327952Sdim      if (!(L.Line < R.Line) && !(L.Line == R.Line && L.Col < R.Col)) {
540327952Sdim        DEBUG(dbgs() << " ! Segment " << L.Line << ":" << L.Col
541327952Sdim                     << " followed by " << R.Line << ":" << R.Col << "\n");
542327952Sdim        assert(false && "Coverage segments not unique or sorted");
543327952Sdim      }
544327952Sdim    }
545327952Sdim#endif
546327952Sdim
547303231Sdim    return Segments;
548303231Sdim  }
549303231Sdim};
550303231Sdim
551321369Sdim} // end anonymous namespace
552321369Sdim
553303231Sdimstd::vector<StringRef> CoverageMapping::getUniqueSourceFiles() const {
554303231Sdim  std::vector<StringRef> Filenames;
555303231Sdim  for (const auto &Function : getCoveredFunctions())
556303231Sdim    Filenames.insert(Filenames.end(), Function.Filenames.begin(),
557303231Sdim                     Function.Filenames.end());
558303231Sdim  std::sort(Filenames.begin(), Filenames.end());
559303231Sdim  auto Last = std::unique(Filenames.begin(), Filenames.end());
560303231Sdim  Filenames.erase(Last, Filenames.end());
561303231Sdim  return Filenames;
562303231Sdim}
563303231Sdim
564303231Sdimstatic SmallBitVector gatherFileIDs(StringRef SourceFile,
565303231Sdim                                    const FunctionRecord &Function) {
566303231Sdim  SmallBitVector FilenameEquivalence(Function.Filenames.size(), false);
567303231Sdim  for (unsigned I = 0, E = Function.Filenames.size(); I < E; ++I)
568303231Sdim    if (SourceFile == Function.Filenames[I])
569303231Sdim      FilenameEquivalence[I] = true;
570303231Sdim  return FilenameEquivalence;
571303231Sdim}
572303231Sdim
573303231Sdim/// Return the ID of the file where the definition of the function is located.
574303231Sdimstatic Optional<unsigned> findMainViewFileID(const FunctionRecord &Function) {
575303231Sdim  SmallBitVector IsNotExpandedFile(Function.Filenames.size(), true);
576303231Sdim  for (const auto &CR : Function.CountedRegions)
577303231Sdim    if (CR.Kind == CounterMappingRegion::ExpansionRegion)
578303231Sdim      IsNotExpandedFile[CR.ExpandedFileID] = false;
579303231Sdim  int I = IsNotExpandedFile.find_first();
580303231Sdim  if (I == -1)
581303231Sdim    return None;
582303231Sdim  return I;
583303231Sdim}
584303231Sdim
585303231Sdim/// Check if SourceFile is the file that contains the definition of
586303231Sdim/// the Function. Return the ID of the file in that case or None otherwise.
587303231Sdimstatic Optional<unsigned> findMainViewFileID(StringRef SourceFile,
588303231Sdim                                             const FunctionRecord &Function) {
589303231Sdim  Optional<unsigned> I = findMainViewFileID(Function);
590303231Sdim  if (I && SourceFile == Function.Filenames[*I])
591303231Sdim    return I;
592303231Sdim  return None;
593303231Sdim}
594303231Sdim
595303231Sdimstatic bool isExpansion(const CountedRegion &R, unsigned FileID) {
596303231Sdim  return R.Kind == CounterMappingRegion::ExpansionRegion && R.FileID == FileID;
597303231Sdim}
598303231Sdim
599303231SdimCoverageData CoverageMapping::getCoverageForFile(StringRef Filename) const {
600303231Sdim  CoverageData FileCoverage(Filename);
601321369Sdim  std::vector<CountedRegion> Regions;
602303231Sdim
603303231Sdim  for (const auto &Function : Functions) {
604303231Sdim    auto MainFileID = findMainViewFileID(Filename, Function);
605303231Sdim    auto FileIDs = gatherFileIDs(Filename, Function);
606303231Sdim    for (const auto &CR : Function.CountedRegions)
607303231Sdim      if (FileIDs.test(CR.FileID)) {
608303231Sdim        Regions.push_back(CR);
609303231Sdim        if (MainFileID && isExpansion(CR, *MainFileID))
610303231Sdim          FileCoverage.Expansions.emplace_back(CR, Function);
611303231Sdim      }
612303231Sdim  }
613303231Sdim
614303231Sdim  DEBUG(dbgs() << "Emitting segments for file: " << Filename << "\n");
615303231Sdim  FileCoverage.Segments = SegmentBuilder::buildSegments(Regions);
616303231Sdim
617303231Sdim  return FileCoverage;
618303231Sdim}
619303231Sdim
620327952Sdimstd::vector<InstantiationGroup>
621327952SdimCoverageMapping::getInstantiationGroups(StringRef Filename) const {
622303231Sdim  FunctionInstantiationSetCollector InstantiationSetCollector;
623303231Sdim  for (const auto &Function : Functions) {
624303231Sdim    auto MainFileID = findMainViewFileID(Filename, Function);
625303231Sdim    if (!MainFileID)
626303231Sdim      continue;
627303231Sdim    InstantiationSetCollector.insert(Function, *MainFileID);
628303231Sdim  }
629303231Sdim
630327952Sdim  std::vector<InstantiationGroup> Result;
631327952Sdim  for (auto &InstantiationSet : InstantiationSetCollector) {
632327952Sdim    InstantiationGroup IG{InstantiationSet.first.first,
633327952Sdim                          InstantiationSet.first.second,
634327952Sdim                          std::move(InstantiationSet.second)};
635327952Sdim    Result.emplace_back(std::move(IG));
636303231Sdim  }
637303231Sdim  return Result;
638303231Sdim}
639303231Sdim
640303231SdimCoverageData
641303231SdimCoverageMapping::getCoverageForFunction(const FunctionRecord &Function) const {
642303231Sdim  auto MainFileID = findMainViewFileID(Function);
643303231Sdim  if (!MainFileID)
644303231Sdim    return CoverageData();
645303231Sdim
646303231Sdim  CoverageData FunctionCoverage(Function.Filenames[*MainFileID]);
647321369Sdim  std::vector<CountedRegion> Regions;
648303231Sdim  for (const auto &CR : Function.CountedRegions)
649303231Sdim    if (CR.FileID == *MainFileID) {
650303231Sdim      Regions.push_back(CR);
651303231Sdim      if (isExpansion(CR, *MainFileID))
652303231Sdim        FunctionCoverage.Expansions.emplace_back(CR, Function);
653303231Sdim    }
654303231Sdim
655303231Sdim  DEBUG(dbgs() << "Emitting segments for function: " << Function.Name << "\n");
656303231Sdim  FunctionCoverage.Segments = SegmentBuilder::buildSegments(Regions);
657303231Sdim
658303231Sdim  return FunctionCoverage;
659303231Sdim}
660303231Sdim
661303231SdimCoverageData CoverageMapping::getCoverageForExpansion(
662303231Sdim    const ExpansionRecord &Expansion) const {
663303231Sdim  CoverageData ExpansionCoverage(
664303231Sdim      Expansion.Function.Filenames[Expansion.FileID]);
665321369Sdim  std::vector<CountedRegion> Regions;
666303231Sdim  for (const auto &CR : Expansion.Function.CountedRegions)
667303231Sdim    if (CR.FileID == Expansion.FileID) {
668303231Sdim      Regions.push_back(CR);
669303231Sdim      if (isExpansion(CR, Expansion.FileID))
670303231Sdim        ExpansionCoverage.Expansions.emplace_back(CR, Expansion.Function);
671303231Sdim    }
672303231Sdim
673303231Sdim  DEBUG(dbgs() << "Emitting segments for expansion of file " << Expansion.FileID
674303231Sdim               << "\n");
675303231Sdim  ExpansionCoverage.Segments = SegmentBuilder::buildSegments(Regions);
676303231Sdim
677303231Sdim  return ExpansionCoverage;
678303231Sdim}
679303231Sdim
680327952SdimLineCoverageStats::LineCoverageStats(
681327952Sdim    ArrayRef<const CoverageSegment *> LineSegments,
682327952Sdim    const CoverageSegment *WrappedSegment, unsigned Line)
683327952Sdim    : ExecutionCount(0), HasMultipleRegions(false), Mapped(false), Line(Line),
684327952Sdim      LineSegments(LineSegments), WrappedSegment(WrappedSegment) {
685327952Sdim  // Find the minimum number of regions which start in this line.
686327952Sdim  unsigned MinRegionCount = 0;
687327952Sdim  auto isStartOfRegion = [](const CoverageSegment *S) {
688327952Sdim    return !S->IsGapRegion && S->HasCount && S->IsRegionEntry;
689327952Sdim  };
690327952Sdim  for (unsigned I = 0; I < LineSegments.size() && MinRegionCount < 2; ++I)
691327952Sdim    if (isStartOfRegion(LineSegments[I]))
692327952Sdim      ++MinRegionCount;
693327952Sdim
694327952Sdim  bool StartOfSkippedRegion = !LineSegments.empty() &&
695327952Sdim                              !LineSegments.front()->HasCount &&
696327952Sdim                              LineSegments.front()->IsRegionEntry;
697327952Sdim
698327952Sdim  HasMultipleRegions = MinRegionCount > 1;
699327952Sdim  Mapped =
700327952Sdim      !StartOfSkippedRegion &&
701327952Sdim      ((WrappedSegment && WrappedSegment->HasCount) || (MinRegionCount > 0));
702327952Sdim
703327952Sdim  if (!Mapped)
704327952Sdim    return;
705327952Sdim
706327952Sdim  // Pick the max count from the non-gap, region entry segments and the
707327952Sdim  // wrapped count.
708327952Sdim  if (WrappedSegment)
709327952Sdim    ExecutionCount = WrappedSegment->Count;
710327952Sdim  if (!MinRegionCount)
711327952Sdim    return;
712327952Sdim  for (const auto *LS : LineSegments)
713327952Sdim    if (isStartOfRegion(LS))
714327952Sdim      ExecutionCount = std::max(ExecutionCount, LS->Count);
715327952Sdim}
716327952Sdim
717327952SdimLineCoverageIterator &LineCoverageIterator::operator++() {
718327952Sdim  if (Next == CD.end()) {
719327952Sdim    Stats = LineCoverageStats();
720327952Sdim    Ended = true;
721327952Sdim    return *this;
722327952Sdim  }
723327952Sdim  if (Segments.size())
724327952Sdim    WrappedSegment = Segments.back();
725327952Sdim  Segments.clear();
726327952Sdim  while (Next != CD.end() && Next->Line == Line)
727327952Sdim    Segments.push_back(&*Next++);
728327952Sdim  Stats = LineCoverageStats(Segments, WrappedSegment, Line);
729327952Sdim  ++Line;
730327952Sdim  return *this;
731327952Sdim}
732327952Sdim
733321369Sdimstatic std::string getCoverageMapErrString(coveragemap_error Err) {
734303231Sdim  switch (Err) {
735303231Sdim  case coveragemap_error::success:
736303231Sdim    return "Success";
737303231Sdim  case coveragemap_error::eof:
738303231Sdim    return "End of File";
739303231Sdim  case coveragemap_error::no_data_found:
740303231Sdim    return "No coverage data found";
741303231Sdim  case coveragemap_error::unsupported_version:
742303231Sdim    return "Unsupported coverage format version";
743303231Sdim  case coveragemap_error::truncated:
744303231Sdim    return "Truncated coverage data";
745303231Sdim  case coveragemap_error::malformed:
746303231Sdim    return "Malformed coverage data";
747303231Sdim  }
748303231Sdim  llvm_unreachable("A value of coveragemap_error has no message.");
749303231Sdim}
750303231Sdim
751321369Sdimnamespace {
752321369Sdim
753303231Sdim// FIXME: This class is only here to support the transition to llvm::Error. It
754303231Sdim// will be removed once this transition is complete. Clients should prefer to
755303231Sdim// deal with the Error value directly, rather than converting to error_code.
756303231Sdimclass CoverageMappingErrorCategoryType : public std::error_category {
757314564Sdim  const char *name() const noexcept override { return "llvm.coveragemap"; }
758303231Sdim  std::string message(int IE) const override {
759303231Sdim    return getCoverageMapErrString(static_cast<coveragemap_error>(IE));
760303231Sdim  }
761303231Sdim};
762321369Sdim
763303231Sdim} // end anonymous namespace
764303231Sdim
765303231Sdimstd::string CoverageMapError::message() const {
766303231Sdim  return getCoverageMapErrString(Err);
767303231Sdim}
768303231Sdim
769303231Sdimstatic ManagedStatic<CoverageMappingErrorCategoryType> ErrorCategory;
770303231Sdim
771303231Sdimconst std::error_category &llvm::coverage::coveragemap_category() {
772303231Sdim  return *ErrorCategory;
773303231Sdim}
774303231Sdim
// Out-of-line definition of the static member CoverageMapError::ID.
// NOTE(review): presumably the per-class type tag required by llvm::ErrorInfo
// (its address, not its value, would be what matters) — confirm against the
// class declaration in CoverageMapping.h.
775303231Sdimchar CoverageMapError::ID = 0;
776