clang 20.0.0git
CoverageMappingGen.cpp
Go to the documentation of this file.
1//===--- CoverageMappingGen.cpp - Coverage mapping generation ---*- C++ -*-===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// Instrumentation-based code coverage mapping generator
10//
11//===----------------------------------------------------------------------===//
12
13#include "CoverageMappingGen.h"
14#include "CodeGenFunction.h"
19#include "clang/Lex/Lexer.h"
20#include "llvm/ADT/DenseSet.h"
21#include "llvm/ADT/SmallSet.h"
22#include "llvm/ADT/StringExtras.h"
23#include "llvm/ProfileData/Coverage/CoverageMapping.h"
24#include "llvm/ProfileData/Coverage/CoverageMappingReader.h"
25#include "llvm/ProfileData/Coverage/CoverageMappingWriter.h"
26#include "llvm/ProfileData/InstrProfReader.h"
27#include "llvm/Support/FileSystem.h"
28#include "llvm/Support/Path.h"
29#include <optional>
30
31// This selects the coverage mapping format defined when `InstrProfData.inc`
32// is textually included.
33#define COVMAP_V3
34
35namespace llvm {
36cl::opt<bool>
37 EnableSingleByteCoverage("enable-single-byte-coverage",
38 llvm::cl::ZeroOrMore,
39 llvm::cl::desc("Enable single byte coverage"),
40 llvm::cl::Hidden, llvm::cl::init(false));
41} // namespace llvm
42
43static llvm::cl::opt<bool> EmptyLineCommentCoverage(
44 "emptyline-comment-coverage",
45 llvm::cl::desc("Emit emptylines and comment lines as skipped regions (only "
46 "disable it on test)"),
47 llvm::cl::init(true), llvm::cl::Hidden);
48
49namespace llvm::coverage {
51 "system-headers-coverage",
52 cl::desc("Enable collecting coverage from system headers"), cl::init(false),
53 cl::Hidden);
54}
55
56using namespace clang;
57using namespace CodeGen;
58using namespace llvm::coverage;
59
62 CoverageSourceInfo *CoverageInfo =
64 PP.addPPCallbacks(std::unique_ptr<PPCallbacks>(CoverageInfo));
66 PP.addCommentHandler(CoverageInfo);
67 PP.setEmptylineHandler(CoverageInfo);
68 PP.setPreprocessToken(true);
69 PP.setTokenWatcher([CoverageInfo](clang::Token Tok) {
70 // Update previous token location.
71 CoverageInfo->PrevTokLoc = Tok.getLocation();
72 if (Tok.getKind() != clang::tok::eod)
73 CoverageInfo->updateNextTokLoc(Tok.getLocation());
74 });
75 }
76 return CoverageInfo;
77}
78
80 SkippedRange::Kind RangeKind) {
81 if (EmptyLineCommentCoverage && !SkippedRanges.empty() &&
82 PrevTokLoc == SkippedRanges.back().PrevTokLoc &&
83 SourceMgr.isWrittenInSameFile(SkippedRanges.back().Range.getEnd(),
84 Range.getBegin()))
85 SkippedRanges.back().Range.setEnd(Range.getEnd());
86 else
87 SkippedRanges.push_back({Range, RangeKind, PrevTokLoc});
88}
89
91 AddSkippedRange(Range, SkippedRange::PPIfElse);
92}
93
95 AddSkippedRange(Range, SkippedRange::EmptyLine);
96}
97
99 AddSkippedRange(Range, SkippedRange::Comment);
100 return false;
101}
102
104 if (!SkippedRanges.empty() && SkippedRanges.back().NextTokLoc.isInvalid())
105 SkippedRanges.back().NextTokLoc = Loc;
106}
107
108namespace {
109/// A region of source code that can be mapped to a counter.
110class SourceMappingRegion {
111 /// Primary Counter that is also used for Branch Regions for "True" branches.
112 Counter Count;
113
114 /// Secondary Counter used for Branch Regions for "False" branches.
115 std::optional<Counter> FalseCount;
116
117 /// Parameters used for Modified Condition/Decision Coverage
118 mcdc::Parameters MCDCParams;
119
120 /// The region's starting location.
121 std::optional<SourceLocation> LocStart;
122
123 /// The region's ending location.
124 std::optional<SourceLocation> LocEnd;
125
126 /// Whether this region is a gap region. The count from a gap region is set
127 /// as the line execution count if there are no other regions on the line.
128 bool GapRegion;
129
130 /// Whetever this region is skipped ('if constexpr' or 'if consteval' untaken
131 /// branch, or anything skipped but not empty line / comments)
132 bool SkippedRegion;
133
134public:
135 SourceMappingRegion(Counter Count, std::optional<SourceLocation> LocStart,
136 std::optional<SourceLocation> LocEnd,
137 bool GapRegion = false)
138 : Count(Count), LocStart(LocStart), LocEnd(LocEnd), GapRegion(GapRegion),
139 SkippedRegion(false) {}
140
141 SourceMappingRegion(Counter Count, std::optional<Counter> FalseCount,
142 mcdc::Parameters MCDCParams,
143 std::optional<SourceLocation> LocStart,
144 std::optional<SourceLocation> LocEnd,
145 bool GapRegion = false)
146 : Count(Count), FalseCount(FalseCount), MCDCParams(MCDCParams),
147 LocStart(LocStart), LocEnd(LocEnd), GapRegion(GapRegion),
148 SkippedRegion(false) {}
149
150 SourceMappingRegion(mcdc::Parameters MCDCParams,
151 std::optional<SourceLocation> LocStart,
152 std::optional<SourceLocation> LocEnd)
153 : MCDCParams(MCDCParams), LocStart(LocStart), LocEnd(LocEnd),
154 GapRegion(false), SkippedRegion(false) {}
155
156 const Counter &getCounter() const { return Count; }
157
158 const Counter &getFalseCounter() const {
159 assert(FalseCount && "Region has no alternate counter");
160 return *FalseCount;
161 }
162
163 void setCounter(Counter C) { Count = C; }
164
165 bool hasStartLoc() const { return LocStart.has_value(); }
166
167 void setStartLoc(SourceLocation Loc) { LocStart = Loc; }
168
169 SourceLocation getBeginLoc() const {
170 assert(LocStart && "Region has no start location");
171 return *LocStart;
172 }
173
174 bool hasEndLoc() const { return LocEnd.has_value(); }
175
176 void setEndLoc(SourceLocation Loc) {
177 assert(Loc.isValid() && "Setting an invalid end location");
178 LocEnd = Loc;
179 }
180
181 SourceLocation getEndLoc() const {
182 assert(LocEnd && "Region has no end location");
183 return *LocEnd;
184 }
185
186 bool isGap() const { return GapRegion; }
187
188 void setGap(bool Gap) { GapRegion = Gap; }
189
190 bool isSkipped() const { return SkippedRegion; }
191
192 void setSkipped(bool Skipped) { SkippedRegion = Skipped; }
193
194 bool isBranch() const { return FalseCount.has_value(); }
195
196 bool isMCDCBranch() const {
197 return std::holds_alternative<mcdc::BranchParameters>(MCDCParams);
198 }
199
200 const auto &getMCDCBranchParams() const {
201 return mcdc::getParams<const mcdc::BranchParameters>(MCDCParams);
202 }
203
204 bool isMCDCDecision() const {
205 return std::holds_alternative<mcdc::DecisionParameters>(MCDCParams);
206 }
207
208 const auto &getMCDCDecisionParams() const {
209 return mcdc::getParams<const mcdc::DecisionParameters>(MCDCParams);
210 }
211
212 const mcdc::Parameters &getMCDCParams() const { return MCDCParams; }
213
214 void resetMCDCParams() { MCDCParams = mcdc::Parameters(); }
215};
216
217/// Spelling locations for the start and end of a source region.
218struct SpellingRegion {
219 /// The line where the region starts.
220 unsigned LineStart;
221
222 /// The column where the region starts.
223 unsigned ColumnStart;
224
225 /// The line where the region ends.
226 unsigned LineEnd;
227
228 /// The column where the region ends.
229 unsigned ColumnEnd;
230
231 SpellingRegion(SourceManager &SM, SourceLocation LocStart,
232 SourceLocation LocEnd) {
233 LineStart = SM.getSpellingLineNumber(LocStart);
234 ColumnStart = SM.getSpellingColumnNumber(LocStart);
235 LineEnd = SM.getSpellingLineNumber(LocEnd);
236 ColumnEnd = SM.getSpellingColumnNumber(LocEnd);
237 }
238
239 SpellingRegion(SourceManager &SM, SourceMappingRegion &R)
240 : SpellingRegion(SM, R.getBeginLoc(), R.getEndLoc()) {}
241
242 /// Check if the start and end locations appear in source order, i.e
243 /// top->bottom, left->right.
244 bool isInSourceOrder() const {
245 return (LineStart < LineEnd) ||
246 (LineStart == LineEnd && ColumnStart <= ColumnEnd);
247 }
248};
249
250/// Provides the common functionality for the different
251/// coverage mapping region builders.
252class CoverageMappingBuilder {
253public:
256 const LangOptions &LangOpts;
257
258private:
259 /// Map of clang's FileIDs to IDs used for coverage mapping.
260 llvm::SmallDenseMap<FileID, std::pair<unsigned, SourceLocation>, 8>
261 FileIDMapping;
262
263public:
264 /// The coverage mapping regions for this function
266 /// The source mapping regions for this function.
267 std::vector<SourceMappingRegion> SourceRegions;
268
269 /// A set of regions which can be used as a filter.
270 ///
271 /// It is produced by emitExpansionRegions() and is used in
272 /// emitSourceRegions() to suppress producing code regions if
273 /// the same area is covered by expansion regions.
274 typedef llvm::SmallSet<std::pair<SourceLocation, SourceLocation>, 8>
275 SourceRegionFilter;
276
277 CoverageMappingBuilder(CoverageMappingModuleGen &CVM, SourceManager &SM,
278 const LangOptions &LangOpts)
279 : CVM(CVM), SM(SM), LangOpts(LangOpts) {}
280
281 /// Return the precise end location for the given token.
282 SourceLocation getPreciseTokenLocEnd(SourceLocation Loc) {
283 // We avoid getLocForEndOfToken here, because it doesn't do what we want for
284 // macro locations, which we just treat as expanded files.
285 unsigned TokLen =
286 Lexer::MeasureTokenLength(SM.getSpellingLoc(Loc), SM, LangOpts);
287 return Loc.getLocWithOffset(TokLen);
288 }
289
290 /// Return the start location of an included file or expanded macro.
291 SourceLocation getStartOfFileOrMacro(SourceLocation Loc) {
292 if (Loc.isMacroID())
293 return Loc.getLocWithOffset(-SM.getFileOffset(Loc));
294 return SM.getLocForStartOfFile(SM.getFileID(Loc));
295 }
296
297 /// Return the end location of an included file or expanded macro.
298 SourceLocation getEndOfFileOrMacro(SourceLocation Loc) {
299 if (Loc.isMacroID())
300 return Loc.getLocWithOffset(SM.getFileIDSize(SM.getFileID(Loc)) -
301 SM.getFileOffset(Loc));
302 return SM.getLocForEndOfFile(SM.getFileID(Loc));
303 }
304
305 /// Find out where a macro is expanded. If the immediate result is a
306 /// <scratch space>, keep looking until the result isn't. Return a pair of
307 /// \c SourceLocation. The first object is always the begin sloc of found
308 /// result. The second should be checked by the caller: if it has value, it's
309 /// the end sloc of the found result. Otherwise the while loop didn't get
310 /// executed, which means the location wasn't changed and the caller has to
311 /// learn the end sloc from somewhere else.
312 std::pair<SourceLocation, std::optional<SourceLocation>>
313 getNonScratchExpansionLoc(SourceLocation Loc) {
314 std::optional<SourceLocation> EndLoc = std::nullopt;
315 while (Loc.isMacroID() &&
316 SM.isWrittenInScratchSpace(SM.getSpellingLoc(Loc))) {
317 auto ExpansionRange = SM.getImmediateExpansionRange(Loc);
318 Loc = ExpansionRange.getBegin();
319 EndLoc = ExpansionRange.getEnd();
320 }
321 return std::make_pair(Loc, EndLoc);
322 }
323
324 /// Find out where the current file is included or macro is expanded. If
325 /// \c AcceptScratch is set to false, keep looking for expansions until the
326 /// found sloc is not a <scratch space>.
327 SourceLocation getIncludeOrExpansionLoc(SourceLocation Loc,
328 bool AcceptScratch = true) {
329 if (!Loc.isMacroID())
330 return SM.getIncludeLoc(SM.getFileID(Loc));
331 Loc = SM.getImmediateExpansionRange(Loc).getBegin();
332 if (AcceptScratch)
333 return Loc;
334 return getNonScratchExpansionLoc(Loc).first;
335 }
336
337 /// Return true if \c Loc is a location in a built-in macro.
338 bool isInBuiltin(SourceLocation Loc) {
339 return SM.getBufferName(SM.getSpellingLoc(Loc)) == "<built-in>";
340 }
341
342 /// Check whether \c Loc is included or expanded from \c Parent.
343 bool isNestedIn(SourceLocation Loc, FileID Parent) {
344 do {
345 Loc = getIncludeOrExpansionLoc(Loc);
346 if (Loc.isInvalid())
347 return false;
348 } while (!SM.isInFileID(Loc, Parent));
349 return true;
350 }
351
352 /// Get the start of \c S ignoring macro arguments and builtin macros.
353 SourceLocation getStart(const Stmt *S) {
354 SourceLocation Loc = S->getBeginLoc();
355 while (SM.isMacroArgExpansion(Loc) || isInBuiltin(Loc))
356 Loc = SM.getImmediateExpansionRange(Loc).getBegin();
357 return Loc;
358 }
359
360 /// Get the end of \c S ignoring macro arguments and builtin macros.
361 SourceLocation getEnd(const Stmt *S) {
362 SourceLocation Loc = S->getEndLoc();
363 while (SM.isMacroArgExpansion(Loc) || isInBuiltin(Loc))
364 Loc = SM.getImmediateExpansionRange(Loc).getBegin();
365 return getPreciseTokenLocEnd(Loc);
366 }
367
368 /// Find the set of files we have regions for and assign IDs
369 ///
370 /// Fills \c Mapping with the virtual file mapping needed to write out
371 /// coverage and collects the necessary file information to emit source and
372 /// expansion regions.
373 void gatherFileIDs(SmallVectorImpl<unsigned> &Mapping) {
374 FileIDMapping.clear();
375
376 llvm::SmallSet<FileID, 8> Visited;
378 for (auto &Region : SourceRegions) {
379 SourceLocation Loc = Region.getBeginLoc();
380
381 // Replace Region with its definition if it is in <scratch space>.
382 auto NonScratchExpansionLoc = getNonScratchExpansionLoc(Loc);
383 auto EndLoc = NonScratchExpansionLoc.second;
384 if (EndLoc.has_value()) {
385 Loc = NonScratchExpansionLoc.first;
386 Region.setStartLoc(Loc);
387 Region.setEndLoc(EndLoc.value());
388 }
389
390 // Replace Loc with FileLoc if it is expanded with system headers.
391 if (!SystemHeadersCoverage && SM.isInSystemMacro(Loc)) {
392 auto BeginLoc = SM.getSpellingLoc(Loc);
393 auto EndLoc = SM.getSpellingLoc(Region.getEndLoc());
394 if (SM.isWrittenInSameFile(BeginLoc, EndLoc)) {
395 Loc = SM.getFileLoc(Loc);
396 Region.setStartLoc(Loc);
397 Region.setEndLoc(SM.getFileLoc(Region.getEndLoc()));
398 }
399 }
400
401 FileID File = SM.getFileID(Loc);
402 if (!Visited.insert(File).second)
403 continue;
404
405 assert(SystemHeadersCoverage ||
406 !SM.isInSystemHeader(SM.getSpellingLoc(Loc)));
407
408 unsigned Depth = 0;
409 for (SourceLocation Parent = getIncludeOrExpansionLoc(Loc);
410 Parent.isValid(); Parent = getIncludeOrExpansionLoc(Parent))
411 ++Depth;
412 FileLocs.push_back(std::make_pair(Loc, Depth));
413 }
414 llvm::stable_sort(FileLocs, llvm::less_second());
415
416 for (const auto &FL : FileLocs) {
417 SourceLocation Loc = FL.first;
418 FileID SpellingFile = SM.getDecomposedSpellingLoc(Loc).first;
419 auto Entry = SM.getFileEntryRefForID(SpellingFile);
420 if (!Entry)
421 continue;
422
423 FileIDMapping[SM.getFileID(Loc)] = std::make_pair(Mapping.size(), Loc);
424 Mapping.push_back(CVM.getFileID(*Entry));
425 }
426 }
427
428 /// Get the coverage mapping file ID for \c Loc.
429 ///
430 /// If such file id doesn't exist, return std::nullopt.
431 std::optional<unsigned> getCoverageFileID(SourceLocation Loc) {
432 auto Mapping = FileIDMapping.find(SM.getFileID(Loc));
433 if (Mapping != FileIDMapping.end())
434 return Mapping->second.first;
435 return std::nullopt;
436 }
437
438 /// This shrinks the skipped range if it spans a line that contains a
439 /// non-comment token. If shrinking the skipped range would make it empty,
440 /// this returns std::nullopt.
441 /// Note this function can potentially be expensive because
442 /// getSpellingLineNumber uses getLineNumber, which is expensive.
443 std::optional<SpellingRegion> adjustSkippedRange(SourceManager &SM,
444 SourceLocation LocStart,
445 SourceLocation LocEnd,
446 SourceLocation PrevTokLoc,
447 SourceLocation NextTokLoc) {
448 SpellingRegion SR{SM, LocStart, LocEnd};
449 SR.ColumnStart = 1;
450 if (PrevTokLoc.isValid() && SM.isWrittenInSameFile(LocStart, PrevTokLoc) &&
451 SR.LineStart == SM.getSpellingLineNumber(PrevTokLoc))
452 SR.LineStart++;
453 if (NextTokLoc.isValid() && SM.isWrittenInSameFile(LocEnd, NextTokLoc) &&
454 SR.LineEnd == SM.getSpellingLineNumber(NextTokLoc)) {
455 SR.LineEnd--;
456 SR.ColumnEnd++;
457 }
458 if (SR.isInSourceOrder())
459 return SR;
460 return std::nullopt;
461 }
462
463 /// Gather all the regions that were skipped by the preprocessor
464 /// using the constructs like #if or comments.
465 void gatherSkippedRegions() {
466 /// An array of the minimum lineStarts and the maximum lineEnds
467 /// for mapping regions from the appropriate source files.
469 FileLineRanges.resize(
470 FileIDMapping.size(),
471 std::make_pair(std::numeric_limits<unsigned>::max(), 0));
472 for (const auto &R : MappingRegions) {
473 FileLineRanges[R.FileID].first =
474 std::min(FileLineRanges[R.FileID].first, R.LineStart);
475 FileLineRanges[R.FileID].second =
476 std::max(FileLineRanges[R.FileID].second, R.LineEnd);
477 }
478
479 auto SkippedRanges = CVM.getSourceInfo().getSkippedRanges();
480 for (auto &I : SkippedRanges) {
481 SourceRange Range = I.Range;
482 auto LocStart = Range.getBegin();
483 auto LocEnd = Range.getEnd();
484 assert(SM.isWrittenInSameFile(LocStart, LocEnd) &&
485 "region spans multiple files");
486
487 auto CovFileID = getCoverageFileID(LocStart);
488 if (!CovFileID)
489 continue;
490 std::optional<SpellingRegion> SR;
491 if (I.isComment())
492 SR = adjustSkippedRange(SM, LocStart, LocEnd, I.PrevTokLoc,
493 I.NextTokLoc);
494 else if (I.isPPIfElse() || I.isEmptyLine())
495 SR = {SM, LocStart, LocEnd};
496
497 if (!SR)
498 continue;
499 auto Region = CounterMappingRegion::makeSkipped(
500 *CovFileID, SR->LineStart, SR->ColumnStart, SR->LineEnd,
501 SR->ColumnEnd);
502 // Make sure that we only collect the regions that are inside
503 // the source code of this function.
504 if (Region.LineStart >= FileLineRanges[*CovFileID].first &&
505 Region.LineEnd <= FileLineRanges[*CovFileID].second)
506 MappingRegions.push_back(Region);
507 }
508 }
509
510 /// Generate the coverage counter mapping regions from collected
511 /// source regions.
512 void emitSourceRegions(const SourceRegionFilter &Filter) {
513 for (const auto &Region : SourceRegions) {
514 assert(Region.hasEndLoc() && "incomplete region");
515
516 SourceLocation LocStart = Region.getBeginLoc();
517 assert(SM.getFileID(LocStart).isValid() && "region in invalid file");
518
519 // Ignore regions from system headers unless collecting coverage from
520 // system headers is explicitly enabled.
522 SM.isInSystemHeader(SM.getSpellingLoc(LocStart))) {
523 assert(!Region.isMCDCBranch() && !Region.isMCDCDecision() &&
524 "Don't suppress the condition in system headers");
525 continue;
526 }
527
528 auto CovFileID = getCoverageFileID(LocStart);
529 // Ignore regions that don't have a file, such as builtin macros.
530 if (!CovFileID) {
531 assert(!Region.isMCDCBranch() && !Region.isMCDCDecision() &&
532 "Don't suppress the condition in non-file regions");
533 continue;
534 }
535
536 SourceLocation LocEnd = Region.getEndLoc();
537 assert(SM.isWrittenInSameFile(LocStart, LocEnd) &&
538 "region spans multiple files");
539
540 // Don't add code regions for the area covered by expansion regions.
541 // This not only suppresses redundant regions, but sometimes prevents
542 // creating regions with wrong counters if, for example, a statement's
543 // body ends at the end of a nested macro.
544 if (Filter.count(std::make_pair(LocStart, LocEnd))) {
545 assert(!Region.isMCDCBranch() && !Region.isMCDCDecision() &&
546 "Don't suppress the condition");
547 continue;
548 }
549
550 // Find the spelling locations for the mapping region.
551 SpellingRegion SR{SM, LocStart, LocEnd};
552 assert(SR.isInSourceOrder() && "region start and end out of order");
553
554 if (Region.isGap()) {
555 MappingRegions.push_back(CounterMappingRegion::makeGapRegion(
556 Region.getCounter(), *CovFileID, SR.LineStart, SR.ColumnStart,
557 SR.LineEnd, SR.ColumnEnd));
558 } else if (Region.isSkipped()) {
559 MappingRegions.push_back(CounterMappingRegion::makeSkipped(
560 *CovFileID, SR.LineStart, SR.ColumnStart, SR.LineEnd,
561 SR.ColumnEnd));
562 } else if (Region.isBranch()) {
563 MappingRegions.push_back(CounterMappingRegion::makeBranchRegion(
564 Region.getCounter(), Region.getFalseCounter(), *CovFileID,
565 SR.LineStart, SR.ColumnStart, SR.LineEnd, SR.ColumnEnd,
566 Region.getMCDCParams()));
567 } else if (Region.isMCDCDecision()) {
568 MappingRegions.push_back(CounterMappingRegion::makeDecisionRegion(
569 Region.getMCDCDecisionParams(), *CovFileID, SR.LineStart,
570 SR.ColumnStart, SR.LineEnd, SR.ColumnEnd));
571 } else {
572 MappingRegions.push_back(CounterMappingRegion::makeRegion(
573 Region.getCounter(), *CovFileID, SR.LineStart, SR.ColumnStart,
574 SR.LineEnd, SR.ColumnEnd));
575 }
576 }
577 }
578
579 /// Generate expansion regions for each virtual file we've seen.
580 SourceRegionFilter emitExpansionRegions() {
581 SourceRegionFilter Filter;
582 for (const auto &FM : FileIDMapping) {
583 SourceLocation ExpandedLoc = FM.second.second;
584 SourceLocation ParentLoc = getIncludeOrExpansionLoc(ExpandedLoc, false);
585 if (ParentLoc.isInvalid())
586 continue;
587
588 auto ParentFileID = getCoverageFileID(ParentLoc);
589 if (!ParentFileID)
590 continue;
591 auto ExpandedFileID = getCoverageFileID(ExpandedLoc);
592 assert(ExpandedFileID && "expansion in uncovered file");
593
594 SourceLocation LocEnd = getPreciseTokenLocEnd(ParentLoc);
595 assert(SM.isWrittenInSameFile(ParentLoc, LocEnd) &&
596 "region spans multiple files");
597 Filter.insert(std::make_pair(ParentLoc, LocEnd));
598
599 SpellingRegion SR{SM, ParentLoc, LocEnd};
600 assert(SR.isInSourceOrder() && "region start and end out of order");
601 MappingRegions.push_back(CounterMappingRegion::makeExpansion(
602 *ParentFileID, *ExpandedFileID, SR.LineStart, SR.ColumnStart,
603 SR.LineEnd, SR.ColumnEnd));
604 }
605 return Filter;
606 }
607};
608
609/// Creates unreachable coverage regions for the functions that
610/// are not emitted.
611struct EmptyCoverageMappingBuilder : public CoverageMappingBuilder {
612 EmptyCoverageMappingBuilder(CoverageMappingModuleGen &CVM, SourceManager &SM,
613 const LangOptions &LangOpts)
614 : CoverageMappingBuilder(CVM, SM, LangOpts) {}
615
616 void VisitDecl(const Decl *D) {
617 if (!D->hasBody())
618 return;
619 auto Body = D->getBody();
620 SourceLocation Start = getStart(Body);
621 SourceLocation End = getEnd(Body);
622 if (!SM.isWrittenInSameFile(Start, End)) {
623 // Walk up to find the common ancestor.
624 // Correct the locations accordingly.
625 FileID StartFileID = SM.getFileID(Start);
626 FileID EndFileID = SM.getFileID(End);
627 while (StartFileID != EndFileID && !isNestedIn(End, StartFileID)) {
628 Start = getIncludeOrExpansionLoc(Start);
629 assert(Start.isValid() &&
630 "Declaration start location not nested within a known region");
631 StartFileID = SM.getFileID(Start);
632 }
633 while (StartFileID != EndFileID) {
634 End = getPreciseTokenLocEnd(getIncludeOrExpansionLoc(End));
635 assert(End.isValid() &&
636 "Declaration end location not nested within a known region");
637 EndFileID = SM.getFileID(End);
638 }
639 }
640 SourceRegions.emplace_back(Counter(), Start, End);
641 }
642
643 /// Write the mapping data to the output stream
644 void write(llvm::raw_ostream &OS) {
645 SmallVector<unsigned, 16> FileIDMapping;
646 gatherFileIDs(FileIDMapping);
647 emitSourceRegions(SourceRegionFilter());
648
649 if (MappingRegions.empty())
650 return;
651
652 CoverageMappingWriter Writer(FileIDMapping, std::nullopt, MappingRegions);
653 Writer.write(OS);
654 }
655};
656
657/// A wrapper object for maintaining stacks to track the resursive AST visitor
658/// walks for the purpose of assigning IDs to leaf-level conditions measured by
659/// MC/DC. The object is created with a reference to the MCDCBitmapMap that was
660/// created during the initial AST walk. The presence of a bitmap associated
661/// with a boolean expression (top-level logical operator nest) indicates that
662/// the boolean expression qualified for MC/DC. The resulting condition IDs
663/// are preserved in a map reference that is also provided during object
664/// creation.
665struct MCDCCoverageBuilder {
666
667 /// The AST walk recursively visits nested logical-AND or logical-OR binary
668 /// operator nodes and then visits their LHS and RHS children nodes. As this
669 /// happens, the algorithm will assign IDs to each operator's LHS and RHS side
670 /// as the walk moves deeper into the nest. At each level of the recursive
671 /// nest, the LHS and RHS may actually correspond to larger subtrees (not
672 /// leaf-conditions). If this is the case, when that node is visited, the ID
673 /// assigned to the subtree is re-assigned to its LHS, and a new ID is given
674 /// to its RHS. At the end of the walk, all leaf-level conditions will have a
675 /// unique ID -- keep in mind that the final set of IDs may not be in
676 /// numerical order from left to right.
677 ///
678 /// Example: "x = (A && B) || (C && D) || (D && F)"
679 ///
680 /// Visit Depth1:
681 /// (A && B) || (C && D) || (D && F)
682 /// ^-------LHS--------^ ^-RHS--^
683 /// ID=1 ID=2
684 ///
685 /// Visit LHS-Depth2:
686 /// (A && B) || (C && D)
687 /// ^-LHS--^ ^-RHS--^
688 /// ID=1 ID=3
689 ///
690 /// Visit LHS-Depth3:
691 /// (A && B)
692 /// LHS RHS
693 /// ID=1 ID=4
694 ///
695 /// Visit RHS-Depth3:
696 /// (C && D)
697 /// LHS RHS
698 /// ID=3 ID=5
699 ///
700 /// Visit RHS-Depth2: (D && F)
701 /// LHS RHS
702 /// ID=2 ID=6
703 ///
704 /// Visit Depth1:
705 /// (A && B) || (C && D) || (D && F)
706 /// ID=1 ID=4 ID=3 ID=5 ID=2 ID=6
707 ///
708 /// A node ID of '0' always means MC/DC isn't being tracked.
709 ///
710 /// As the AST walk proceeds recursively, the algorithm will also use a stack
711 /// to track the IDs of logical-AND and logical-OR operations on the RHS so
712 /// that it can be determined which nodes are executed next, depending on how
713 /// a LHS or RHS of a logical-AND or logical-OR is evaluated. This
714 /// information relies on the assigned IDs and are embedded within the
715 /// coverage region IDs of each branch region associated with a leaf-level
716 /// condition. This information helps the visualization tool reconstruct all
717 /// possible test vectors for the purposes of MC/DC analysis. If a "next" node
718 /// ID is '0', it means it's the end of the test vector. The following rules
719 /// are used:
720 ///
721 /// For logical-AND ("LHS && RHS"):
722 /// - If LHS is TRUE, execution goes to the RHS node.
723 /// - If LHS is FALSE, execution goes to the LHS node of the next logical-OR.
724 /// If that does not exist, execution exits (ID == 0).
725 ///
726 /// - If RHS is TRUE, execution goes to LHS node of the next logical-AND.
727 /// If that does not exist, execution exits (ID == 0).
728 /// - If RHS is FALSE, execution goes to the LHS node of the next logical-OR.
729 /// If that does not exist, execution exits (ID == 0).
730 ///
731 /// For logical-OR ("LHS || RHS"):
732 /// - If LHS is TRUE, execution goes to the LHS node of the next logical-AND.
733 /// If that does not exist, execution exits (ID == 0).
734 /// - If LHS is FALSE, execution goes to the RHS node.
735 ///
736 /// - If RHS is TRUE, execution goes to LHS node of the next logical-AND.
737 /// If that does not exist, execution exits (ID == 0).
738 /// - If RHS is FALSE, execution goes to the LHS node of the next logical-OR.
739 /// If that does not exist, execution exits (ID == 0).
740 ///
741 /// Finally, the condition IDs are also used when instrumenting the code to
742 /// indicate a unique offset into a temporary bitmap that represents the true
743 /// or false evaluation of that particular condition.
744 ///
745 /// NOTE regarding the use of CodeGenFunction::stripCond(). Even though, for
746 /// simplicity, parentheses and unary logical-NOT operators are considered
747 /// part of their underlying condition for both MC/DC and branch coverage, the
748 /// condition IDs themselves are assigned and tracked using the underlying
749 /// condition itself. This is done solely for consistency since parentheses
750 /// and logical-NOTs are ignored when checking whether the condition is
751 /// actually an instrumentable condition. This can also make debugging a bit
752 /// easier.
753
754private:
755 CodeGenModule &CGM;
756
758 MCDC::State &MCDCState;
759 const Stmt *DecisionStmt = nullptr;
760 mcdc::ConditionID NextID = 0;
761 bool NotMapped = false;
762
763 /// Represent a sentinel value as a pair of final decisions for the bottom
764 // of DecisionStack.
765 static constexpr mcdc::ConditionIDs DecisionStackSentinel{-1, -1};
766
767 /// Is this a logical-AND operation?
768 bool isLAnd(const BinaryOperator *E) const {
769 return E->getOpcode() == BO_LAnd;
770 }
771
772public:
773 MCDCCoverageBuilder(CodeGenModule &CGM, MCDC::State &MCDCState)
774 : CGM(CGM), DecisionStack(1, DecisionStackSentinel),
775 MCDCState(MCDCState) {}
776
777 /// Return whether the build of the control flow map is at the top-level
778 /// (root) of a logical operator nest in a boolean expression prior to the
779 /// assignment of condition IDs.
780 bool isIdle() const { return (NextID == 0 && !NotMapped); }
781
782 /// Return whether any IDs have been assigned in the build of the control
783 /// flow map, indicating that the map is being generated for this boolean
784 /// expression.
785 bool isBuilding() const { return (NextID > 0); }
786
787 /// Set the given condition's ID.
788 void setCondID(const Expr *Cond, mcdc::ConditionID ID) {
789 MCDCState.BranchByStmt[CodeGenFunction::stripCond(Cond)] = {ID,
790 DecisionStmt};
791 }
792
793 /// Return the ID of a given condition.
794 mcdc::ConditionID getCondID(const Expr *Cond) const {
795 auto I = MCDCState.BranchByStmt.find(CodeGenFunction::stripCond(Cond));
796 if (I == MCDCState.BranchByStmt.end())
797 return -1;
798 else
799 return I->second.ID;
800 }
801
802 /// Return the LHS Decision ([0,0] if not set).
803 const mcdc::ConditionIDs &back() const { return DecisionStack.back(); }
804
805 /// Push the binary operator statement to track the nest level and assign IDs
806 /// to the operator's LHS and RHS. The RHS may be a larger subtree that is
807 /// broken up on successive levels.
808 void pushAndAssignIDs(const BinaryOperator *E) {
809 if (!CGM.getCodeGenOpts().MCDCCoverage)
810 return;
811
812 // If binary expression is disqualified, don't do mapping.
813 if (!isBuilding() &&
814 !MCDCState.DecisionByStmt.contains(CodeGenFunction::stripCond(E)))
815 NotMapped = true;
816
817 // Don't go any further if we don't need to map condition IDs.
818 if (NotMapped)
819 return;
820
821 if (NextID == 0) {
822 DecisionStmt = E;
823 assert(MCDCState.DecisionByStmt.contains(E));
824 }
825
826 const mcdc::ConditionIDs &ParentDecision = DecisionStack.back();
827
828 // If the operator itself has an assigned ID, this means it represents a
829 // larger subtree. In this case, assign that ID to its LHS node. Its RHS
830 // will receive a new ID below. Otherwise, assign ID+1 to LHS.
831 if (MCDCState.BranchByStmt.contains(CodeGenFunction::stripCond(E)))
832 setCondID(E->getLHS(), getCondID(E));
833 else
834 setCondID(E->getLHS(), NextID++);
835
836 // Assign a ID+1 for the RHS.
837 mcdc::ConditionID RHSid = NextID++;
838 setCondID(E->getRHS(), RHSid);
839
840 // Push the LHS decision IDs onto the DecisionStack.
841 if (isLAnd(E))
842 DecisionStack.push_back({ParentDecision[false], RHSid});
843 else
844 DecisionStack.push_back({RHSid, ParentDecision[true]});
845 }
846
847 /// Pop and return the LHS Decision ([0,0] if not set).
848 mcdc::ConditionIDs pop() {
849 if (!CGM.getCodeGenOpts().MCDCCoverage || NotMapped)
850 return DecisionStackSentinel;
851
852 assert(DecisionStack.size() > 1);
853 return DecisionStack.pop_back_val();
854 }
855
856 /// Return the total number of conditions and reset the state. The number of
857 /// conditions is zero if the expression isn't mapped.
858 unsigned getTotalConditionsAndReset(const BinaryOperator *E) {
859 if (!CGM.getCodeGenOpts().MCDCCoverage)
860 return 0;
861
862 assert(!isIdle());
863 assert(DecisionStack.size() == 1);
864
865 // Reset state if not doing mapping.
866 if (NotMapped) {
867 NotMapped = false;
868 assert(NextID == 0);
869 return 0;
870 }
871
872 // Set number of conditions and reset.
873 unsigned TotalConds = NextID;
874
875 // Reset ID back to beginning.
876 NextID = 0;
877
878 return TotalConds;
879 }
880};
881
882/// A StmtVisitor that creates coverage mapping regions which map
883/// from the source code locations to the PGO counters.
884struct CounterCoverageMappingBuilder
885 : public CoverageMappingBuilder,
886 public ConstStmtVisitor<CounterCoverageMappingBuilder> {
887 /// The map of statements to count values.
888 llvm::DenseMap<const Stmt *, unsigned> &CounterMap;
889
890 MCDC::State &MCDCState;
891
892 /// A stack of currently live regions.
894
895 /// Set if the Expr should be handled as a leaf even if it is kind of binary
896 /// logical ops (&&, ||).
897 llvm::DenseSet<const Stmt *> LeafExprSet;
898
899 /// An object to manage MCDC regions.
900 MCDCCoverageBuilder MCDCBuilder;
901
902 CounterExpressionBuilder Builder;
903
904 /// A location in the most recently visited file or macro.
905 ///
906 /// This is used to adjust the active source regions appropriately when
907 /// expressions cross file or macro boundaries.
908 SourceLocation MostRecentLocation;
909
910 /// Whether the visitor at a terminate statement.
911 bool HasTerminateStmt = false;
912
913 /// Gap region counter after terminate statement.
914 Counter GapRegionCounter;
915
916 /// Return a counter for the subtraction of \c RHS from \c LHS
917 Counter subtractCounters(Counter LHS, Counter RHS, bool Simplify = true) {
919 "cannot add counters when single byte coverage mode is enabled");
920 return Builder.subtract(LHS, RHS, Simplify);
921 }
922
923 /// Return a counter for the sum of \c LHS and \c RHS.
924 Counter addCounters(Counter LHS, Counter RHS, bool Simplify = true) {
926 "cannot add counters when single byte coverage mode is enabled");
927 return Builder.add(LHS, RHS, Simplify);
928 }
929
930 Counter addCounters(Counter C1, Counter C2, Counter C3,
931 bool Simplify = true) {
933 "cannot add counters when single byte coverage mode is enabled");
934 return addCounters(addCounters(C1, C2, Simplify), C3, Simplify);
935 }
936
937 /// Return the region counter for the given statement.
938 ///
939 /// This should only be called on statements that have a dedicated counter.
940 Counter getRegionCounter(const Stmt *S) {
941 return Counter::getCounter(CounterMap[S]);
942 }
943
944 /// Push a region onto the stack.
945 ///
946 /// Returns the index on the stack where the region was pushed. This can be
947 /// used with popRegions to exit a "scope", ending the region that was pushed.
948 size_t pushRegion(Counter Count,
949 std::optional<SourceLocation> StartLoc = std::nullopt,
950 std::optional<SourceLocation> EndLoc = std::nullopt,
951 std::optional<Counter> FalseCount = std::nullopt,
952 const mcdc::Parameters &BranchParams = std::monostate()) {
953
954 if (StartLoc && !FalseCount) {
955 MostRecentLocation = *StartLoc;
956 }
957
958 // If either of these locations is invalid, something elsewhere in the
959 // compiler has broken.
960 assert((!StartLoc || StartLoc->isValid()) && "Start location is not valid");
961 assert((!EndLoc || EndLoc->isValid()) && "End location is not valid");
962
963 // However, we can still recover without crashing.
964 // If either location is invalid, set it to std::nullopt to avoid
965 // letting users of RegionStack think that region has a valid start/end
966 // location.
967 if (StartLoc && StartLoc->isInvalid())
968 StartLoc = std::nullopt;
969 if (EndLoc && EndLoc->isInvalid())
970 EndLoc = std::nullopt;
971 RegionStack.emplace_back(Count, FalseCount, BranchParams, StartLoc, EndLoc);
972
973 return RegionStack.size() - 1;
974 }
975
976 size_t pushRegion(const mcdc::DecisionParameters &DecisionParams,
977 std::optional<SourceLocation> StartLoc = std::nullopt,
978 std::optional<SourceLocation> EndLoc = std::nullopt) {
979
980 RegionStack.emplace_back(DecisionParams, StartLoc, EndLoc);
981
982 return RegionStack.size() - 1;
983 }
984
985 size_t locationDepth(SourceLocation Loc) {
986 size_t Depth = 0;
987 while (Loc.isValid()) {
988 Loc = getIncludeOrExpansionLoc(Loc);
989 Depth++;
990 }
991 return Depth;
992 }
993
994 /// Pop regions from the stack into the function's list of regions.
995 ///
996 /// Adds all regions from \c ParentIndex to the top of the stack to the
997 /// function's \c SourceRegions.
998 void popRegions(size_t ParentIndex) {
999 assert(RegionStack.size() >= ParentIndex && "parent not in stack");
1000 while (RegionStack.size() > ParentIndex) {
1001 SourceMappingRegion &Region = RegionStack.back();
1002 if (Region.hasStartLoc() &&
1003 (Region.hasEndLoc() || RegionStack[ParentIndex].hasEndLoc())) {
1004 SourceLocation StartLoc = Region.getBeginLoc();
1005 SourceLocation EndLoc = Region.hasEndLoc()
1006 ? Region.getEndLoc()
1007 : RegionStack[ParentIndex].getEndLoc();
1008 bool isBranch = Region.isBranch();
1009 size_t StartDepth = locationDepth(StartLoc);
1010 size_t EndDepth = locationDepth(EndLoc);
1011 while (!SM.isWrittenInSameFile(StartLoc, EndLoc)) {
1012 bool UnnestStart = StartDepth >= EndDepth;
1013 bool UnnestEnd = EndDepth >= StartDepth;
1014 if (UnnestEnd) {
1015 // The region ends in a nested file or macro expansion. If the
1016 // region is not a branch region, create a separate region for each
1017 // expansion, and for all regions, update the EndLoc. Branch
1018 // regions should not be split in order to keep a straightforward
1019 // correspondance between the region and its associated branch
1020 // condition, even if the condition spans multiple depths.
1021 SourceLocation NestedLoc = getStartOfFileOrMacro(EndLoc);
1022 assert(SM.isWrittenInSameFile(NestedLoc, EndLoc));
1023
1024 if (!isBranch && !isRegionAlreadyAdded(NestedLoc, EndLoc))
1025 SourceRegions.emplace_back(Region.getCounter(), NestedLoc,
1026 EndLoc);
1027
1028 EndLoc = getPreciseTokenLocEnd(getIncludeOrExpansionLoc(EndLoc));
1029 if (EndLoc.isInvalid())
1030 llvm::report_fatal_error(
1031 "File exit not handled before popRegions");
1032 EndDepth--;
1033 }
1034 if (UnnestStart) {
1035 // The region ends in a nested file or macro expansion. If the
1036 // region is not a branch region, create a separate region for each
1037 // expansion, and for all regions, update the StartLoc. Branch
1038 // regions should not be split in order to keep a straightforward
1039 // correspondance between the region and its associated branch
1040 // condition, even if the condition spans multiple depths.
1041 SourceLocation NestedLoc = getEndOfFileOrMacro(StartLoc);
1042 assert(SM.isWrittenInSameFile(StartLoc, NestedLoc));
1043
1044 if (!isBranch && !isRegionAlreadyAdded(StartLoc, NestedLoc))
1045 SourceRegions.emplace_back(Region.getCounter(), StartLoc,
1046 NestedLoc);
1047
1048 StartLoc = getIncludeOrExpansionLoc(StartLoc);
1049 if (StartLoc.isInvalid())
1050 llvm::report_fatal_error(
1051 "File exit not handled before popRegions");
1052 StartDepth--;
1053 }
1054 }
1055 Region.setStartLoc(StartLoc);
1056 Region.setEndLoc(EndLoc);
1057
1058 if (!isBranch) {
1059 MostRecentLocation = EndLoc;
1060 // If this region happens to span an entire expansion, we need to
1061 // make sure we don't overlap the parent region with it.
1062 if (StartLoc == getStartOfFileOrMacro(StartLoc) &&
1063 EndLoc == getEndOfFileOrMacro(EndLoc))
1064 MostRecentLocation = getIncludeOrExpansionLoc(EndLoc);
1065 }
1066
1067 assert(SM.isWrittenInSameFile(Region.getBeginLoc(), EndLoc));
1068 assert(SpellingRegion(SM, Region).isInSourceOrder());
1069 SourceRegions.push_back(Region);
1070 }
1071 RegionStack.pop_back();
1072 }
1073 }
1074
1075 /// Return the currently active region.
1076 SourceMappingRegion &getRegion() {
1077 assert(!RegionStack.empty() && "statement has no region");
1078 return RegionStack.back();
1079 }
1080
1081 /// Propagate counts through the children of \p S if \p VisitChildren is true.
1082 /// Otherwise, only emit a count for \p S itself.
1083 Counter propagateCounts(Counter TopCount, const Stmt *S,
1084 bool VisitChildren = true) {
1085 SourceLocation StartLoc = getStart(S);
1086 SourceLocation EndLoc = getEnd(S);
1087 size_t Index = pushRegion(TopCount, StartLoc, EndLoc);
1088 if (VisitChildren)
1089 Visit(S);
1090 Counter ExitCount = getRegion().getCounter();
1091 popRegions(Index);
1092
1093 // The statement may be spanned by an expansion. Make sure we handle a file
1094 // exit out of this expansion before moving to the next statement.
1095 if (SM.isBeforeInTranslationUnit(StartLoc, S->getBeginLoc()))
1096 MostRecentLocation = EndLoc;
1097
1098 return ExitCount;
1099 }
1100
1101 /// Determine whether the given condition can be constant folded.
1102 bool ConditionFoldsToBool(const Expr *Cond) {
1103 Expr::EvalResult Result;
1104 return (Cond->EvaluateAsInt(Result, CVM.getCodeGenModule().getContext()));
1105 }
1106
1107 /// Create a Branch Region around an instrumentable condition for coverage
1108 /// and add it to the function's SourceRegions. A branch region tracks a
1109 /// "True" counter and a "False" counter for boolean expressions that
1110 /// result in the generation of a branch.
1111 void createBranchRegion(const Expr *C, Counter TrueCnt, Counter FalseCnt,
1112 const mcdc::ConditionIDs &Conds = {}) {
1113 // Check for NULL conditions.
1114 if (!C)
1115 return;
1116
1117 // Ensure we are an instrumentable condition (i.e. no "&&" or "||"). Push
1118 // region onto RegionStack but immediately pop it (which adds it to the
1119 // function's SourceRegions) because it doesn't apply to any other source
1120 // code other than the Condition.
1121 // With !SystemHeadersCoverage, binary logical ops in system headers may be
1122 // treated as instrumentable conditions.
1123 if (CodeGenFunction::isInstrumentedCondition(C) ||
1124 LeafExprSet.count(CodeGenFunction::stripCond(C))) {
1125 mcdc::Parameters BranchParams;
1126 mcdc::ConditionID ID = MCDCBuilder.getCondID(C);
1127 if (ID >= 0)
1128 BranchParams = mcdc::BranchParameters{ID, Conds};
1129
1130 // If a condition can fold to true or false, the corresponding branch
1131 // will be removed. Create a region with both counters hard-coded to
1132 // zero. This allows us to visualize them in a special way.
1133 // Alternatively, we can prevent any optimization done via
1134 // constant-folding by ensuring that ConstantFoldsToSimpleInteger() in
1135 // CodeGenFunction.c always returns false, but that is very heavy-handed.
1136 if (ConditionFoldsToBool(C))
1137 popRegions(pushRegion(Counter::getZero(), getStart(C), getEnd(C),
1138 Counter::getZero(), BranchParams));
1139 else
1140 // Otherwise, create a region with the True counter and False counter.
1141 popRegions(pushRegion(TrueCnt, getStart(C), getEnd(C), FalseCnt,
1142 BranchParams));
1143 }
1144 }
1145
1146 /// Create a Decision Region with a BitmapIdx and number of Conditions. This
1147 /// type of region "contains" branch regions, one for each of the conditions.
1148 /// The visualization tool will group everything together.
1149 void createDecisionRegion(const Expr *C,
1150 const mcdc::DecisionParameters &DecisionParams) {
1151 popRegions(pushRegion(DecisionParams, getStart(C), getEnd(C)));
1152 }
1153
1154 /// Create a Branch Region around a SwitchCase for code coverage
1155 /// and add it to the function's SourceRegions.
1156 void createSwitchCaseRegion(const SwitchCase *SC, Counter TrueCnt,
1157 Counter FalseCnt) {
1158 // Push region onto RegionStack but immediately pop it (which adds it to
1159 // the function's SourceRegions) because it doesn't apply to any other
1160 // source other than the SwitchCase.
1161 popRegions(pushRegion(TrueCnt, getStart(SC), SC->getColonLoc(), FalseCnt));
1162 }
1163
1164 /// Check whether a region with bounds \c StartLoc and \c EndLoc
1165 /// is already added to \c SourceRegions.
1166 bool isRegionAlreadyAdded(SourceLocation StartLoc, SourceLocation EndLoc,
1167 bool isBranch = false) {
1168 return llvm::any_of(
1169 llvm::reverse(SourceRegions), [&](const SourceMappingRegion &Region) {
1170 return Region.getBeginLoc() == StartLoc &&
1171 Region.getEndLoc() == EndLoc && Region.isBranch() == isBranch;
1172 });
1173 }
1174
1175 /// Adjust the most recently visited location to \c EndLoc.
1176 ///
1177 /// This should be used after visiting any statements in non-source order.
1178 void adjustForOutOfOrderTraversal(SourceLocation EndLoc) {
1179 MostRecentLocation = EndLoc;
1180 // The code region for a whole macro is created in handleFileExit() when
1181 // it detects exiting of the virtual file of that macro. If we visited
1182 // statements in non-source order, we might already have such a region
1183 // added, for example, if a body of a loop is divided among multiple
1184 // macros. Avoid adding duplicate regions in such case.
1185 if (getRegion().hasEndLoc() &&
1186 MostRecentLocation == getEndOfFileOrMacro(MostRecentLocation) &&
1187 isRegionAlreadyAdded(getStartOfFileOrMacro(MostRecentLocation),
1188 MostRecentLocation, getRegion().isBranch()))
1189 MostRecentLocation = getIncludeOrExpansionLoc(MostRecentLocation);
1190 }
1191
1192 /// Adjust regions and state when \c NewLoc exits a file.
1193 ///
1194 /// If moving from our most recently tracked location to \c NewLoc exits any
1195 /// files, this adjusts our current region stack and creates the file regions
1196 /// for the exited file.
1197 void handleFileExit(SourceLocation NewLoc) {
1198 if (NewLoc.isInvalid() ||
1199 SM.isWrittenInSameFile(MostRecentLocation, NewLoc))
1200 return;
1201
1202 // If NewLoc is not in a file that contains MostRecentLocation, walk up to
1203 // find the common ancestor.
1204 SourceLocation LCA = NewLoc;
1205 FileID ParentFile = SM.getFileID(LCA);
1206 while (!isNestedIn(MostRecentLocation, ParentFile)) {
1207 LCA = getIncludeOrExpansionLoc(LCA);
1208 if (LCA.isInvalid() || SM.isWrittenInSameFile(LCA, MostRecentLocation)) {
1209 // Since there isn't a common ancestor, no file was exited. We just need
1210 // to adjust our location to the new file.
1211 MostRecentLocation = NewLoc;
1212 return;
1213 }
1214 ParentFile = SM.getFileID(LCA);
1215 }
1216
1217 llvm::SmallSet<SourceLocation, 8> StartLocs;
1218 std::optional<Counter> ParentCounter;
1219 for (SourceMappingRegion &I : llvm::reverse(RegionStack)) {
1220 if (!I.hasStartLoc())
1221 continue;
1222 SourceLocation Loc = I.getBeginLoc();
1223 if (!isNestedIn(Loc, ParentFile)) {
1224 ParentCounter = I.getCounter();
1225 break;
1226 }
1227
1228 while (!SM.isInFileID(Loc, ParentFile)) {
1229 // The most nested region for each start location is the one with the
1230 // correct count. We avoid creating redundant regions by stopping once
1231 // we've seen this region.
1232 if (StartLocs.insert(Loc).second) {
1233 if (I.isBranch())
1234 SourceRegions.emplace_back(I.getCounter(), I.getFalseCounter(),
1235 I.getMCDCParams(), Loc,
1236 getEndOfFileOrMacro(Loc), I.isBranch());
1237 else
1238 SourceRegions.emplace_back(I.getCounter(), Loc,
1239 getEndOfFileOrMacro(Loc));
1240 }
1241 Loc = getIncludeOrExpansionLoc(Loc);
1242 }
1243 I.setStartLoc(getPreciseTokenLocEnd(Loc));
1244 }
1245
1246 if (ParentCounter) {
1247 // If the file is contained completely by another region and doesn't
1248 // immediately start its own region, the whole file gets a region
1249 // corresponding to the parent.
1250 SourceLocation Loc = MostRecentLocation;
1251 while (isNestedIn(Loc, ParentFile)) {
1252 SourceLocation FileStart = getStartOfFileOrMacro(Loc);
1253 if (StartLocs.insert(FileStart).second) {
1254 SourceRegions.emplace_back(*ParentCounter, FileStart,
1255 getEndOfFileOrMacro(Loc));
1256 assert(SpellingRegion(SM, SourceRegions.back()).isInSourceOrder());
1257 }
1258 Loc = getIncludeOrExpansionLoc(Loc);
1259 }
1260 }
1261
1262 MostRecentLocation = NewLoc;
1263 }
1264
1265 /// Ensure that \c S is included in the current region.
1266 void extendRegion(const Stmt *S) {
1267 SourceMappingRegion &Region = getRegion();
1268 SourceLocation StartLoc = getStart(S);
1269
1270 handleFileExit(StartLoc);
1271 if (!Region.hasStartLoc())
1272 Region.setStartLoc(StartLoc);
1273 }
1274
1275 /// Mark \c S as a terminator, starting a zero region.
1276 void terminateRegion(const Stmt *S) {
1277 extendRegion(S);
1278 SourceMappingRegion &Region = getRegion();
1279 SourceLocation EndLoc = getEnd(S);
1280 if (!Region.hasEndLoc())
1281 Region.setEndLoc(EndLoc);
1282 pushRegion(Counter::getZero());
1283 HasTerminateStmt = true;
1284 }
1285
1286 /// Find a valid gap range between \p AfterLoc and \p BeforeLoc.
1287 std::optional<SourceRange> findGapAreaBetween(SourceLocation AfterLoc,
1288 SourceLocation BeforeLoc) {
1289 // Some statements (like AttributedStmt and ImplicitValueInitExpr) don't
1290 // have valid source locations. Do not emit a gap region if this is the case
1291 // in either AfterLoc end or BeforeLoc end.
1292 if (AfterLoc.isInvalid() || BeforeLoc.isInvalid())
1293 return std::nullopt;
1294
1295 // If AfterLoc is in function-like macro, use the right parenthesis
1296 // location.
1297 if (AfterLoc.isMacroID()) {
1298 FileID FID = SM.getFileID(AfterLoc);
1299 const SrcMgr::ExpansionInfo *EI = &SM.getSLocEntry(FID).getExpansion();
1300 if (EI->isFunctionMacroExpansion())
1301 AfterLoc = EI->getExpansionLocEnd();
1302 }
1303
1304 size_t StartDepth = locationDepth(AfterLoc);
1305 size_t EndDepth = locationDepth(BeforeLoc);
1306 while (!SM.isWrittenInSameFile(AfterLoc, BeforeLoc)) {
1307 bool UnnestStart = StartDepth >= EndDepth;
1308 bool UnnestEnd = EndDepth >= StartDepth;
1309 if (UnnestEnd) {
1310 assert(SM.isWrittenInSameFile(getStartOfFileOrMacro(BeforeLoc),
1311 BeforeLoc));
1312
1313 BeforeLoc = getIncludeOrExpansionLoc(BeforeLoc);
1314 assert(BeforeLoc.isValid());
1315 EndDepth--;
1316 }
1317 if (UnnestStart) {
1318 assert(SM.isWrittenInSameFile(AfterLoc,
1319 getEndOfFileOrMacro(AfterLoc)));
1320
1321 AfterLoc = getIncludeOrExpansionLoc(AfterLoc);
1322 assert(AfterLoc.isValid());
1323 AfterLoc = getPreciseTokenLocEnd(AfterLoc);
1324 assert(AfterLoc.isValid());
1325 StartDepth--;
1326 }
1327 }
1328 AfterLoc = getPreciseTokenLocEnd(AfterLoc);
1329 // If the start and end locations of the gap are both within the same macro
1330 // file, the range may not be in source order.
1331 if (AfterLoc.isMacroID() || BeforeLoc.isMacroID())
1332 return std::nullopt;
1333 if (!SM.isWrittenInSameFile(AfterLoc, BeforeLoc) ||
1334 !SpellingRegion(SM, AfterLoc, BeforeLoc).isInSourceOrder())
1335 return std::nullopt;
1336 return {{AfterLoc, BeforeLoc}};
1337 }
1338
1339 /// Emit a gap region between \p StartLoc and \p EndLoc with the given count.
1340 void fillGapAreaWithCount(SourceLocation StartLoc, SourceLocation EndLoc,
1341 Counter Count) {
1342 if (StartLoc == EndLoc)
1343 return;
1344 assert(SpellingRegion(SM, StartLoc, EndLoc).isInSourceOrder());
1345 handleFileExit(StartLoc);
1346 size_t Index = pushRegion(Count, StartLoc, EndLoc);
1347 getRegion().setGap(true);
1348 handleFileExit(EndLoc);
1349 popRegions(Index);
1350 }
1351
1352 /// Find a valid range starting with \p StartingLoc and ending before \p
1353 /// BeforeLoc.
1354 std::optional<SourceRange> findAreaStartingFromTo(SourceLocation StartingLoc,
1355 SourceLocation BeforeLoc) {
1356 // If StartingLoc is in function-like macro, use its start location.
1357 if (StartingLoc.isMacroID()) {
1358 FileID FID = SM.getFileID(StartingLoc);
1359 const SrcMgr::ExpansionInfo *EI = &SM.getSLocEntry(FID).getExpansion();
1360 if (EI->isFunctionMacroExpansion())
1361 StartingLoc = EI->getExpansionLocStart();
1362 }
1363
1364 size_t StartDepth = locationDepth(StartingLoc);
1365 size_t EndDepth = locationDepth(BeforeLoc);
1366 while (!SM.isWrittenInSameFile(StartingLoc, BeforeLoc)) {
1367 bool UnnestStart = StartDepth >= EndDepth;
1368 bool UnnestEnd = EndDepth >= StartDepth;
1369 if (UnnestEnd) {
1370 assert(SM.isWrittenInSameFile(getStartOfFileOrMacro(BeforeLoc),
1371 BeforeLoc));
1372
1373 BeforeLoc = getIncludeOrExpansionLoc(BeforeLoc);
1374 assert(BeforeLoc.isValid());
1375 EndDepth--;
1376 }
1377 if (UnnestStart) {
1378 assert(SM.isWrittenInSameFile(StartingLoc,
1379 getStartOfFileOrMacro(StartingLoc)));
1380
1381 StartingLoc = getIncludeOrExpansionLoc(StartingLoc);
1382 assert(StartingLoc.isValid());
1383 StartDepth--;
1384 }
1385 }
1386 // If the start and end locations of the gap are both within the same macro
1387 // file, the range may not be in source order.
1388 if (StartingLoc.isMacroID() || BeforeLoc.isMacroID())
1389 return std::nullopt;
1390 if (!SM.isWrittenInSameFile(StartingLoc, BeforeLoc) ||
1391 !SpellingRegion(SM, StartingLoc, BeforeLoc).isInSourceOrder())
1392 return std::nullopt;
1393 return {{StartingLoc, BeforeLoc}};
1394 }
1395
1396 void markSkipped(SourceLocation StartLoc, SourceLocation BeforeLoc) {
1397 const auto Skipped = findAreaStartingFromTo(StartLoc, BeforeLoc);
1398
1399 if (!Skipped)
1400 return;
1401
1402 const auto NewStartLoc = Skipped->getBegin();
1403 const auto EndLoc = Skipped->getEnd();
1404
1405 if (NewStartLoc == EndLoc)
1406 return;
1407 assert(SpellingRegion(SM, NewStartLoc, EndLoc).isInSourceOrder());
1408 handleFileExit(NewStartLoc);
1409 size_t Index = pushRegion(Counter{}, NewStartLoc, EndLoc);
1410 getRegion().setSkipped(true);
1411 handleFileExit(EndLoc);
1412 popRegions(Index);
1413 }
1414
1415 /// Keep counts of breaks and continues inside loops.
1416 struct BreakContinue {
1417 Counter BreakCount;
1418 Counter ContinueCount;
1419 };
1420 SmallVector<BreakContinue, 8> BreakContinueStack;
1421
1422 CounterCoverageMappingBuilder(
1424 llvm::DenseMap<const Stmt *, unsigned> &CounterMap,
1425 MCDC::State &MCDCState, SourceManager &SM, const LangOptions &LangOpts)
1426 : CoverageMappingBuilder(CVM, SM, LangOpts), CounterMap(CounterMap),
1427 MCDCState(MCDCState), MCDCBuilder(CVM.getCodeGenModule(), MCDCState) {}
1428
1429 /// Write the mapping data to the output stream
1430 void write(llvm::raw_ostream &OS) {
1431 llvm::SmallVector<unsigned, 8> VirtualFileMapping;
1432 gatherFileIDs(VirtualFileMapping);
1433 SourceRegionFilter Filter = emitExpansionRegions();
1434 emitSourceRegions(Filter);
1435 gatherSkippedRegions();
1436
1437 if (MappingRegions.empty())
1438 return;
1439
1440 CoverageMappingWriter Writer(VirtualFileMapping, Builder.getExpressions(),
1441 MappingRegions);
1442 Writer.write(OS);
1443 }
1444
1445 void VisitStmt(const Stmt *S) {
1446 if (S->getBeginLoc().isValid())
1447 extendRegion(S);
1448 const Stmt *LastStmt = nullptr;
1449 bool SaveTerminateStmt = HasTerminateStmt;
1450 HasTerminateStmt = false;
1451 GapRegionCounter = Counter::getZero();
1452 for (const Stmt *Child : S->children())
1453 if (Child) {
1454 // If last statement contains terminate statements, add a gap area
1455 // between the two statements.
1456 if (LastStmt && HasTerminateStmt) {
1457 auto Gap = findGapAreaBetween(getEnd(LastStmt), getStart(Child));
1458 if (Gap)
1459 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(),
1460 GapRegionCounter);
1461 SaveTerminateStmt = true;
1462 HasTerminateStmt = false;
1463 }
1464 this->Visit(Child);
1465 LastStmt = Child;
1466 }
1467 if (SaveTerminateStmt)
1468 HasTerminateStmt = true;
1469 handleFileExit(getEnd(S));
1470 }
1471
1472 void VisitDecl(const Decl *D) {
1473 Stmt *Body = D->getBody();
1474
1475 // Do not propagate region counts into system headers unless collecting
1476 // coverage from system headers is explicitly enabled.
1477 if (!SystemHeadersCoverage && Body &&
1478 SM.isInSystemHeader(SM.getSpellingLoc(getStart(Body))))
1479 return;
1480
1481 // Do not visit the artificial children nodes of defaulted methods. The
1482 // lexer may not be able to report back precise token end locations for
1483 // these children nodes (llvm.org/PR39822), and moreover users will not be
1484 // able to see coverage for them.
1485 Counter BodyCounter = getRegionCounter(Body);
1486 bool Defaulted = false;
1487 if (auto *Method = dyn_cast<CXXMethodDecl>(D))
1488 Defaulted = Method->isDefaulted();
1489 if (auto *Ctor = dyn_cast<CXXConstructorDecl>(D)) {
1490 for (auto *Initializer : Ctor->inits()) {
1491 if (Initializer->isWritten()) {
1492 auto *Init = Initializer->getInit();
1493 if (getStart(Init).isValid() && getEnd(Init).isValid())
1494 propagateCounts(BodyCounter, Init);
1495 }
1496 }
1497 }
1498
1499 propagateCounts(BodyCounter, Body,
1500 /*VisitChildren=*/!Defaulted);
1501 assert(RegionStack.empty() && "Regions entered but never exited");
1502 }
1503
1504 void VisitReturnStmt(const ReturnStmt *S) {
1505 extendRegion(S);
1506 if (S->getRetValue())
1507 Visit(S->getRetValue());
1508 terminateRegion(S);
1509 }
1510
1511 void VisitCoroutineBodyStmt(const CoroutineBodyStmt *S) {
1512 extendRegion(S);
1513 Visit(S->getBody());
1514 }
1515
1516 void VisitCoreturnStmt(const CoreturnStmt *S) {
1517 extendRegion(S);
1518 if (S->getOperand())
1519 Visit(S->getOperand());
1520 terminateRegion(S);
1521 }
1522
1523 void VisitCoroutineSuspendExpr(const CoroutineSuspendExpr *E) {
1524 Visit(E->getOperand());
1525 }
1526
1527 void VisitCXXThrowExpr(const CXXThrowExpr *E) {
1528 extendRegion(E);
1529 if (E->getSubExpr())
1530 Visit(E->getSubExpr());
1531 terminateRegion(E);
1532 }
1533
1534 void VisitGotoStmt(const GotoStmt *S) { terminateRegion(S); }
1535
1536 void VisitLabelStmt(const LabelStmt *S) {
1537 Counter LabelCount = getRegionCounter(S);
1538 SourceLocation Start = getStart(S);
1539 // We can't extendRegion here or we risk overlapping with our new region.
1540 handleFileExit(Start);
1541 pushRegion(LabelCount, Start);
1542 Visit(S->getSubStmt());
1543 }
1544
1545 void VisitBreakStmt(const BreakStmt *S) {
1546 assert(!BreakContinueStack.empty() && "break not in a loop or switch!");
1548 BreakContinueStack.back().BreakCount = addCounters(
1549 BreakContinueStack.back().BreakCount, getRegion().getCounter());
1550 // FIXME: a break in a switch should terminate regions for all preceding
1551 // case statements, not just the most recent one.
1552 terminateRegion(S);
1553 }
1554
1555 void VisitContinueStmt(const ContinueStmt *S) {
1556 assert(!BreakContinueStack.empty() && "continue stmt not in a loop!");
1558 BreakContinueStack.back().ContinueCount = addCounters(
1559 BreakContinueStack.back().ContinueCount, getRegion().getCounter());
1560 terminateRegion(S);
1561 }
1562
1563 void VisitCallExpr(const CallExpr *E) {
1564 VisitStmt(E);
1565
1566 // Terminate the region when we hit a noreturn function.
1567 // (This is helpful dealing with switch statements.)
1568 QualType CalleeType = E->getCallee()->getType();
1569 if (getFunctionExtInfo(*CalleeType).getNoReturn())
1570 terminateRegion(E);
1571 }
1572
1573 void VisitWhileStmt(const WhileStmt *S) {
1574 extendRegion(S);
1575
1576 Counter ParentCount = getRegion().getCounter();
1577 Counter BodyCount = llvm::EnableSingleByteCoverage
1578 ? getRegionCounter(S->getBody())
1579 : getRegionCounter(S);
1580
1581 // Handle the body first so that we can get the backedge count.
1582 BreakContinueStack.push_back(BreakContinue());
1583 extendRegion(S->getBody());
1584 Counter BackedgeCount = propagateCounts(BodyCount, S->getBody());
1585 BreakContinue BC = BreakContinueStack.pop_back_val();
1586
1587 bool BodyHasTerminateStmt = HasTerminateStmt;
1588 HasTerminateStmt = false;
1589
1590 // Go back to handle the condition.
1591 Counter CondCount =
1593 ? getRegionCounter(S->getCond())
1594 : addCounters(ParentCount, BackedgeCount, BC.ContinueCount);
1595 propagateCounts(CondCount, S->getCond());
1596 adjustForOutOfOrderTraversal(getEnd(S));
1597
1598 // The body count applies to the area immediately after the increment.
1599 auto Gap = findGapAreaBetween(S->getRParenLoc(), getStart(S->getBody()));
1600 if (Gap)
1601 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), BodyCount);
1602
1603 Counter OutCount =
1605 ? getRegionCounter(S)
1606 : addCounters(BC.BreakCount,
1607 subtractCounters(CondCount, BodyCount));
1608
1609 if (OutCount != ParentCount) {
1610 pushRegion(OutCount);
1611 GapRegionCounter = OutCount;
1612 if (BodyHasTerminateStmt)
1613 HasTerminateStmt = true;
1614 }
1615
1616 // Create Branch Region around condition.
1618 createBranchRegion(S->getCond(), BodyCount,
1619 subtractCounters(CondCount, BodyCount));
1620 }
1621
1622 void VisitDoStmt(const DoStmt *S) {
1623 extendRegion(S);
1624
1625 Counter ParentCount = getRegion().getCounter();
1626 Counter BodyCount = llvm::EnableSingleByteCoverage
1627 ? getRegionCounter(S->getBody())
1628 : getRegionCounter(S);
1629
1630 BreakContinueStack.push_back(BreakContinue());
1631 extendRegion(S->getBody());
1632
1633 Counter BackedgeCount;
1635 propagateCounts(BodyCount, S->getBody());
1636 else
1637 BackedgeCount =
1638 propagateCounts(addCounters(ParentCount, BodyCount), S->getBody());
1639
1640 BreakContinue BC = BreakContinueStack.pop_back_val();
1641
1642 bool BodyHasTerminateStmt = HasTerminateStmt;
1643 HasTerminateStmt = false;
1644
1645 Counter CondCount = llvm::EnableSingleByteCoverage
1646 ? getRegionCounter(S->getCond())
1647 : addCounters(BackedgeCount, BC.ContinueCount);
1648 propagateCounts(CondCount, S->getCond());
1649
1650 Counter OutCount =
1652 ? getRegionCounter(S)
1653 : addCounters(BC.BreakCount,
1654 subtractCounters(CondCount, BodyCount));
1655 if (OutCount != ParentCount) {
1656 pushRegion(OutCount);
1657 GapRegionCounter = OutCount;
1658 }
1659
1660 // Create Branch Region around condition.
1662 createBranchRegion(S->getCond(), BodyCount,
1663 subtractCounters(CondCount, BodyCount));
1664
1665 if (BodyHasTerminateStmt)
1666 HasTerminateStmt = true;
1667 }
1668
1669 void VisitForStmt(const ForStmt *S) {
1670 extendRegion(S);
1671 if (S->getInit())
1672 Visit(S->getInit());
1673
1674 Counter ParentCount = getRegion().getCounter();
1675 Counter BodyCount = llvm::EnableSingleByteCoverage
1676 ? getRegionCounter(S->getBody())
1677 : getRegionCounter(S);
1678
1679 // The loop increment may contain a break or continue.
1680 if (S->getInc())
1681 BreakContinueStack.emplace_back();
1682
1683 // Handle the body first so that we can get the backedge count.
1684 BreakContinueStack.emplace_back();
1685 extendRegion(S->getBody());
1686 Counter BackedgeCount = propagateCounts(BodyCount, S->getBody());
1687 BreakContinue BodyBC = BreakContinueStack.pop_back_val();
1688
1689 bool BodyHasTerminateStmt = HasTerminateStmt;
1690 HasTerminateStmt = false;
1691
1692 // The increment is essentially part of the body but it needs to include
1693 // the count for all the continue statements.
1694 BreakContinue IncrementBC;
1695 if (const Stmt *Inc = S->getInc()) {
1696 Counter IncCount;
1698 IncCount = getRegionCounter(S->getInc());
1699 else
1700 IncCount = addCounters(BackedgeCount, BodyBC.ContinueCount);
1701 propagateCounts(IncCount, Inc);
1702 IncrementBC = BreakContinueStack.pop_back_val();
1703 }
1704
1705 // Go back to handle the condition.
1706 Counter CondCount =
1708 ? getRegionCounter(S->getCond())
1709 : addCounters(
1710 addCounters(ParentCount, BackedgeCount, BodyBC.ContinueCount),
1711 IncrementBC.ContinueCount);
1712
1713 if (const Expr *Cond = S->getCond()) {
1714 propagateCounts(CondCount, Cond);
1715 adjustForOutOfOrderTraversal(getEnd(S));
1716 }
1717
1718 // The body count applies to the area immediately after the increment.
1719 auto Gap = findGapAreaBetween(S->getRParenLoc(), getStart(S->getBody()));
1720 if (Gap)
1721 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), BodyCount);
1722
1723 Counter OutCount =
1725 ? getRegionCounter(S)
1726 : addCounters(BodyBC.BreakCount, IncrementBC.BreakCount,
1727 subtractCounters(CondCount, BodyCount));
1728 if (OutCount != ParentCount) {
1729 pushRegion(OutCount);
1730 GapRegionCounter = OutCount;
1731 if (BodyHasTerminateStmt)
1732 HasTerminateStmt = true;
1733 }
1734
1735 // Create Branch Region around condition.
1737 createBranchRegion(S->getCond(), BodyCount,
1738 subtractCounters(CondCount, BodyCount));
1739 }
1740
1741 void VisitCXXForRangeStmt(const CXXForRangeStmt *S) {
1742 extendRegion(S);
1743 if (S->getInit())
1744 Visit(S->getInit());
1745 Visit(S->getLoopVarStmt());
1746 Visit(S->getRangeStmt());
1747
1748 Counter ParentCount = getRegion().getCounter();
1749 Counter BodyCount = llvm::EnableSingleByteCoverage
1750 ? getRegionCounter(S->getBody())
1751 : getRegionCounter(S);
1752
1753 BreakContinueStack.push_back(BreakContinue());
1754 extendRegion(S->getBody());
1755 Counter BackedgeCount = propagateCounts(BodyCount, S->getBody());
1756 BreakContinue BC = BreakContinueStack.pop_back_val();
1757
1758 bool BodyHasTerminateStmt = HasTerminateStmt;
1759 HasTerminateStmt = false;
1760
1761 // The body count applies to the area immediately after the range.
1762 auto Gap = findGapAreaBetween(S->getRParenLoc(), getStart(S->getBody()));
1763 if (Gap)
1764 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), BodyCount);
1765
1766 Counter OutCount;
1767 Counter LoopCount;
1769 OutCount = getRegionCounter(S);
1770 else {
1771 LoopCount = addCounters(ParentCount, BackedgeCount, BC.ContinueCount);
1772 OutCount =
1773 addCounters(BC.BreakCount, subtractCounters(LoopCount, BodyCount));
1774 }
1775 if (OutCount != ParentCount) {
1776 pushRegion(OutCount);
1777 GapRegionCounter = OutCount;
1778 if (BodyHasTerminateStmt)
1779 HasTerminateStmt = true;
1780 }
1781
1782 // Create Branch Region around condition.
1784 createBranchRegion(S->getCond(), BodyCount,
1785 subtractCounters(LoopCount, BodyCount));
1786 }
1787
1788 void VisitObjCForCollectionStmt(const ObjCForCollectionStmt *S) {
1789 extendRegion(S);
1790 Visit(S->getElement());
1791
1792 Counter ParentCount = getRegion().getCounter();
1793 Counter BodyCount = getRegionCounter(S);
1794
1795 BreakContinueStack.push_back(BreakContinue());
1796 extendRegion(S->getBody());
1797 Counter BackedgeCount = propagateCounts(BodyCount, S->getBody());
1798 BreakContinue BC = BreakContinueStack.pop_back_val();
1799
1800 // The body count applies to the area immediately after the collection.
1801 auto Gap = findGapAreaBetween(S->getRParenLoc(), getStart(S->getBody()));
1802 if (Gap)
1803 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), BodyCount);
1804
1805 Counter LoopCount =
1806 addCounters(ParentCount, BackedgeCount, BC.ContinueCount);
1807 Counter OutCount =
1808 addCounters(BC.BreakCount, subtractCounters(LoopCount, BodyCount));
1809 if (OutCount != ParentCount) {
1810 pushRegion(OutCount);
1811 GapRegionCounter = OutCount;
1812 }
1813 }
1814
1815 void VisitSwitchStmt(const SwitchStmt *S) {
1816 extendRegion(S);
1817 if (S->getInit())
1818 Visit(S->getInit());
1819 Visit(S->getCond());
1820
1821 BreakContinueStack.push_back(BreakContinue());
1822
1823 const Stmt *Body = S->getBody();
1824 extendRegion(Body);
1825 if (const auto *CS = dyn_cast<CompoundStmt>(Body)) {
1826 if (!CS->body_empty()) {
1827 // Make a region for the body of the switch. If the body starts with
1828 // a case, that case will reuse this region; otherwise, this covers
1829 // the unreachable code at the beginning of the switch body.
1830 size_t Index = pushRegion(Counter::getZero(), getStart(CS));
1831 getRegion().setGap(true);
1832 Visit(Body);
1833
1834 // Set the end for the body of the switch, if it isn't already set.
1835 for (size_t i = RegionStack.size(); i != Index; --i) {
1836 if (!RegionStack[i - 1].hasEndLoc())
1837 RegionStack[i - 1].setEndLoc(getEnd(CS->body_back()));
1838 }
1839
1840 popRegions(Index);
1841 }
1842 } else
1843 propagateCounts(Counter::getZero(), Body);
1844 BreakContinue BC = BreakContinueStack.pop_back_val();
1845
1846 if (!BreakContinueStack.empty() && !llvm::EnableSingleByteCoverage)
1847 BreakContinueStack.back().ContinueCount = addCounters(
1848 BreakContinueStack.back().ContinueCount, BC.ContinueCount);
1849
1850 Counter ParentCount = getRegion().getCounter();
1851 Counter ExitCount = getRegionCounter(S);
1852 SourceLocation ExitLoc = getEnd(S);
1853 pushRegion(ExitCount);
1854 GapRegionCounter = ExitCount;
1855
1856 // Ensure that handleFileExit recognizes when the end location is located
1857 // in a different file.
1858 MostRecentLocation = getStart(S);
1859 handleFileExit(ExitLoc);
1860
1861 // When single byte coverage mode is enabled, do not create branch region by
1862 // early returning.
1864 return;
1865
1866 // Create a Branch Region around each Case. Subtract the case's
1867 // counter from the Parent counter to track the "False" branch count.
1868 Counter CaseCountSum;
1869 bool HasDefaultCase = false;
1870 const SwitchCase *Case = S->getSwitchCaseList();
1871 for (; Case; Case = Case->getNextSwitchCase()) {
1872 HasDefaultCase = HasDefaultCase || isa<DefaultStmt>(Case);
1873 CaseCountSum =
1874 addCounters(CaseCountSum, getRegionCounter(Case), /*Simplify=*/false);
1875 createSwitchCaseRegion(
1876 Case, getRegionCounter(Case),
1877 subtractCounters(ParentCount, getRegionCounter(Case)));
1878 }
1879 // Simplify is skipped while building the counters above: it can get really
1880 // slow on top of switches with thousands of cases. Instead, trigger
1881 // simplification by adding zero to the last counter.
1882 CaseCountSum = addCounters(CaseCountSum, Counter::getZero());
1883
1884 // If no explicit default case exists, create a branch region to represent
1885 // the hidden branch, which will be added later by the CodeGen. This region
1886 // will be associated with the switch statement's condition.
1887 if (!HasDefaultCase) {
1888 Counter DefaultTrue = subtractCounters(ParentCount, CaseCountSum);
1889 Counter DefaultFalse = subtractCounters(ParentCount, DefaultTrue);
1890 createBranchRegion(S->getCond(), DefaultTrue, DefaultFalse);
1891 }
1892 }
1893
1894 void VisitSwitchCase(const SwitchCase *S) {
1895 extendRegion(S);
1896
1897 SourceMappingRegion &Parent = getRegion();
1898 Counter Count = llvm::EnableSingleByteCoverage
1899 ? getRegionCounter(S)
1900 : addCounters(Parent.getCounter(), getRegionCounter(S));
1901
1902 // Reuse the existing region if it starts at our label. This is typical of
1903 // the first case in a switch.
1904 if (Parent.hasStartLoc() && Parent.getBeginLoc() == getStart(S))
1905 Parent.setCounter(Count);
1906 else
1907 pushRegion(Count, getStart(S));
1908
1909 GapRegionCounter = Count;
1910
1911 if (const auto *CS = dyn_cast<CaseStmt>(S)) {
1912 Visit(CS->getLHS());
1913 if (const Expr *RHS = CS->getRHS())
1914 Visit(RHS);
1915 }
1916 Visit(S->getSubStmt());
1917 }
1918
1919 void coverIfConsteval(const IfStmt *S) {
1920 assert(S->isConsteval());
1921
1922 const auto *Then = S->getThen();
1923 const auto *Else = S->getElse();
1924
1925 // It's better for llvm-cov to create a new region with same counter
1926 // so line-coverage can be properly calculated for lines containing
1927 // a skipped region (without it the line is marked uncovered)
1928 const Counter ParentCount = getRegion().getCounter();
1929
1930 extendRegion(S);
1931
1932 if (S->isNegatedConsteval()) {
1933 // ignore 'if consteval'
1934 markSkipped(S->getIfLoc(), getStart(Then));
1935 propagateCounts(ParentCount, Then);
1936
1937 if (Else) {
1938 // ignore 'else <else>'
1939 markSkipped(getEnd(Then), getEnd(Else));
1940 }
1941 } else {
1942 assert(S->isNonNegatedConsteval());
1943 // ignore 'if consteval <then> [else]'
1944 markSkipped(S->getIfLoc(), Else ? getStart(Else) : getEnd(Then));
1945
1946 if (Else)
1947 propagateCounts(ParentCount, Else);
1948 }
1949 }
1950
1951 void coverIfConstexpr(const IfStmt *S) {
1952 assert(S->isConstexpr());
1953
1954 // evaluate constant condition...
1955 const bool isTrue =
1956 S->getCond()
1957 ->EvaluateKnownConstInt(CVM.getCodeGenModule().getContext())
1958 .getBoolValue();
1959
1960 extendRegion(S);
1961
1962 // I'm using 'propagateCounts' later as new region is better and allows me
1963 // to properly calculate line coverage in llvm-cov utility
1964 const Counter ParentCount = getRegion().getCounter();
1965
1966 // ignore 'if constexpr ('
1967 SourceLocation startOfSkipped = S->getIfLoc();
1968
1969 if (const auto *Init = S->getInit()) {
1970 const auto start = getStart(Init);
1971 const auto end = getEnd(Init);
1972
1973 // this check is to make sure typedef here which doesn't have valid source
1974 // location won't crash it
1975 if (start.isValid() && end.isValid()) {
1976 markSkipped(startOfSkipped, start);
1977 propagateCounts(ParentCount, Init);
1978 startOfSkipped = getEnd(Init);
1979 }
1980 }
1981
1982 const auto *Then = S->getThen();
1983 const auto *Else = S->getElse();
1984
1985 if (isTrue) {
1986 // ignore '<condition>)'
1987 markSkipped(startOfSkipped, getStart(Then));
1988 propagateCounts(ParentCount, Then);
1989
1990 if (Else)
1991 // ignore 'else <else>'
1992 markSkipped(getEnd(Then), getEnd(Else));
1993 } else {
1994 // ignore '<condition>) <then> [else]'
1995 markSkipped(startOfSkipped, Else ? getStart(Else) : getEnd(Then));
1996
1997 if (Else)
1998 propagateCounts(ParentCount, Else);
1999 }
2000 }
2001
2002 void VisitIfStmt(const IfStmt *S) {
2003 // "if constexpr" and "if consteval" are not normal conditional statements,
2004 // their discarded statement should be skipped
2005 if (S->isConsteval())
2006 return coverIfConsteval(S);
2007 else if (S->isConstexpr())
2008 return coverIfConstexpr(S);
2009
2010 extendRegion(S);
2011 if (S->getInit())
2012 Visit(S->getInit());
2013
2014 // Extend into the condition before we propagate through it below - this is
2015 // needed to handle macros that generate the "if" but not the condition.
2016 extendRegion(S->getCond());
2017
2018 Counter ParentCount = getRegion().getCounter();
2019 Counter ThenCount = llvm::EnableSingleByteCoverage
2020 ? getRegionCounter(S->getThen())
2021 : getRegionCounter(S);
2022
2023 // Emitting a counter for the condition makes it easier to interpret the
2024 // counter for the body when looking at the coverage.
2025 propagateCounts(ParentCount, S->getCond());
2026
2027 // The 'then' count applies to the area immediately after the condition.
2028 std::optional<SourceRange> Gap =
2029 findGapAreaBetween(S->getRParenLoc(), getStart(S->getThen()));
2030 if (Gap)
2031 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), ThenCount);
2032
2033 extendRegion(S->getThen());
2034 Counter OutCount = propagateCounts(ThenCount, S->getThen());
2035
2036 Counter ElseCount;
2038 ElseCount = subtractCounters(ParentCount, ThenCount);
2039 else if (S->getElse())
2040 ElseCount = getRegionCounter(S->getElse());
2041
2042 if (const Stmt *Else = S->getElse()) {
2043 bool ThenHasTerminateStmt = HasTerminateStmt;
2044 HasTerminateStmt = false;
2045 // The 'else' count applies to the area immediately after the 'then'.
2046 std::optional<SourceRange> Gap =
2047 findGapAreaBetween(getEnd(S->getThen()), getStart(Else));
2048 if (Gap)
2049 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), ElseCount);
2050 extendRegion(Else);
2051
2052 Counter ElseOutCount = propagateCounts(ElseCount, Else);
2054 OutCount = addCounters(OutCount, ElseOutCount);
2055
2056 if (ThenHasTerminateStmt)
2057 HasTerminateStmt = true;
2059 OutCount = addCounters(OutCount, ElseCount);
2060
2062 OutCount = getRegionCounter(S);
2063
2064 if (OutCount != ParentCount) {
2065 pushRegion(OutCount);
2066 GapRegionCounter = OutCount;
2067 }
2068
2069 if (!S->isConsteval() && !llvm::EnableSingleByteCoverage)
2070 // Create Branch Region around condition.
2071 createBranchRegion(S->getCond(), ThenCount,
2072 subtractCounters(ParentCount, ThenCount));
2073 }
2074
2075 void VisitCXXTryStmt(const CXXTryStmt *S) {
2076 extendRegion(S);
2077 // Handle macros that generate the "try" but not the rest.
2078 extendRegion(S->getTryBlock());
2079
2080 Counter ParentCount = getRegion().getCounter();
2081 propagateCounts(ParentCount, S->getTryBlock());
2082
2083 for (unsigned I = 0, E = S->getNumHandlers(); I < E; ++I)
2084 Visit(S->getHandler(I));
2085
2086 Counter ExitCount = getRegionCounter(S);
2087 pushRegion(ExitCount);
2088 }
2089
2090 void VisitCXXCatchStmt(const CXXCatchStmt *S) {
2091 propagateCounts(getRegionCounter(S), S->getHandlerBlock());
2092 }
2093
2094 void VisitAbstractConditionalOperator(const AbstractConditionalOperator *E) {
2095 extendRegion(E);
2096
2097 Counter ParentCount = getRegion().getCounter();
2098 Counter TrueCount = llvm::EnableSingleByteCoverage
2099 ? getRegionCounter(E->getTrueExpr())
2100 : getRegionCounter(E);
2101 Counter OutCount;
2102
2103 if (const auto *BCO = dyn_cast<BinaryConditionalOperator>(E)) {
2104 propagateCounts(ParentCount, BCO->getCommon());
2105 OutCount = TrueCount;
2106 } else {
2107 propagateCounts(ParentCount, E->getCond());
2108 // The 'then' count applies to the area immediately after the condition.
2109 auto Gap =
2110 findGapAreaBetween(E->getQuestionLoc(), getStart(E->getTrueExpr()));
2111 if (Gap)
2112 fillGapAreaWithCount(Gap->getBegin(), Gap->getEnd(), TrueCount);
2113
2114 extendRegion(E->getTrueExpr());
2115 OutCount = propagateCounts(TrueCount, E->getTrueExpr());
2116 }
2117
2118 extendRegion(E->getFalseExpr());
2119 Counter FalseCount = llvm::EnableSingleByteCoverage
2120 ? getRegionCounter(E->getFalseExpr())
2121 : subtractCounters(ParentCount, TrueCount);
2122
2123 Counter FalseOutCount = propagateCounts(FalseCount, E->getFalseExpr());
2125 OutCount = getRegionCounter(E);
2126 else
2127 OutCount = addCounters(OutCount, FalseOutCount);
2128
2129 if (OutCount != ParentCount) {
2130 pushRegion(OutCount);
2131 GapRegionCounter = OutCount;
2132 }
2133
2134 // Create Branch Region around condition.
2136 createBranchRegion(E->getCond(), TrueCount,
2137 subtractCounters(ParentCount, TrueCount));
2138 }
2139
2140 void createOrCancelDecision(const BinaryOperator *E, unsigned Since) {
2141 unsigned NumConds = MCDCBuilder.getTotalConditionsAndReset(E);
2142 if (NumConds == 0)
2143 return;
2144
2145 // Extract [ID, Conds] to construct the graph.
2146 llvm::SmallVector<mcdc::ConditionIDs> CondIDs(NumConds);
2147 for (const auto &SR : ArrayRef(SourceRegions).slice(Since)) {
2148 if (SR.isMCDCBranch()) {
2149 auto [ID, Conds] = SR.getMCDCBranchParams();
2150 CondIDs[ID] = Conds;
2151 }
2152 }
2153
2154 // Construct the graph and calculate `Indices`.
2155 mcdc::TVIdxBuilder Builder(CondIDs);
2156 unsigned NumTVs = Builder.NumTestVectors;
2157 unsigned MaxTVs = CVM.getCodeGenModule().getCodeGenOpts().MCDCMaxTVs;
2158 assert(MaxTVs < mcdc::TVIdxBuilder::HardMaxTVs);
2159
2160 if (NumTVs > MaxTVs) {
2161 // NumTVs exceeds MaxTVs -- warn and cancel the Decision.
2162 cancelDecision(E, Since, NumTVs, MaxTVs);
2163 return;
2164 }
2165
2166 // Update the state for CodeGenPGO
2167 assert(MCDCState.DecisionByStmt.contains(E));
2168 MCDCState.DecisionByStmt[E] = {
2169 MCDCState.BitmapBits, // Top
2170 std::move(Builder.Indices),
2171 };
2172
2173 auto DecisionParams = mcdc::DecisionParameters{
2174 MCDCState.BitmapBits += NumTVs, // Tail
2175 NumConds,
2176 };
2177
2178 // Create MCDC Decision Region.
2179 createDecisionRegion(E, DecisionParams);
2180 }
2181
2182 // Warn and cancel the Decision.
2183 void cancelDecision(const BinaryOperator *E, unsigned Since, int NumTVs,
2184 int MaxTVs) {
2185 auto &Diag = CVM.getCodeGenModule().getDiags();
2186 unsigned DiagID =
2187 Diag.getCustomDiagID(DiagnosticsEngine::Warning,
2188 "unsupported MC/DC boolean expression; "
2189 "number of test vectors (%0) exceeds max (%1). "
2190 "Expression will not be covered");
2191 Diag.Report(E->getBeginLoc(), DiagID) << NumTVs << MaxTVs;
2192
2193 // Restore MCDCBranch to Branch.
2194 for (auto &SR : MutableArrayRef(SourceRegions).slice(Since)) {
2195 assert(!SR.isMCDCDecision() && "Decision shouldn't be seen here");
2196 if (SR.isMCDCBranch())
2197 SR.resetMCDCParams();
2198 }
2199
2200 // Tell CodeGenPGO not to instrument.
2201 MCDCState.DecisionByStmt.erase(E);
2202 }
2203
2204 /// Check if E belongs to system headers.
2205 bool isExprInSystemHeader(const BinaryOperator *E) const {
2206 return (!SystemHeadersCoverage &&
2207 SM.isInSystemHeader(SM.getSpellingLoc(E->getOperatorLoc())) &&
2208 SM.isInSystemHeader(SM.getSpellingLoc(E->getBeginLoc())) &&
2209 SM.isInSystemHeader(SM.getSpellingLoc(E->getEndLoc())));
2210 }
2211
2212 void VisitBinLAnd(const BinaryOperator *E) {
2213 if (isExprInSystemHeader(E)) {
2214 LeafExprSet.insert(E);
2215 return;
2216 }
2217
2218 bool IsRootNode = MCDCBuilder.isIdle();
2219
2220 unsigned SourceRegionsSince = SourceRegions.size();
2221
2222 // Keep track of Binary Operator and assign MCDC condition IDs.
2223 MCDCBuilder.pushAndAssignIDs(E);
2224
2225 extendRegion(E->getLHS());
2226 propagateCounts(getRegion().getCounter(), E->getLHS());
2227 handleFileExit(getEnd(E->getLHS()));
2228
2229 // Track LHS True/False Decision.
2230 const auto DecisionLHS = MCDCBuilder.pop();
2231
2232 // Counter tracks the right hand side of a logical and operator.
2233 extendRegion(E->getRHS());
2234 propagateCounts(getRegionCounter(E), E->getRHS());
2235
2236 // Track RHS True/False Decision.
2237 const auto DecisionRHS = MCDCBuilder.back();
2238
2239 // Extract the RHS's Execution Counter.
2240 Counter RHSExecCnt = getRegionCounter(E);
2241
2242 // Extract the RHS's "True" Instance Counter.
2243 Counter RHSTrueCnt = getRegionCounter(E->getRHS());
2244
2245 // Extract the Parent Region Counter.
2246 Counter ParentCnt = getRegion().getCounter();
2247
2248 // Create Branch Region around LHS condition.
2250 createBranchRegion(E->getLHS(), RHSExecCnt,
2251 subtractCounters(ParentCnt, RHSExecCnt), DecisionLHS);
2252
2253 // Create Branch Region around RHS condition.
2255 createBranchRegion(E->getRHS(), RHSTrueCnt,
2256 subtractCounters(RHSExecCnt, RHSTrueCnt), DecisionRHS);
2257
2258 // Create MCDC Decision Region if at top-level (root).
2259 if (IsRootNode)
2260 createOrCancelDecision(E, SourceRegionsSince);
2261 }
2262
2263 // Determine whether the right side of OR operation need to be visited.
2264 bool shouldVisitRHS(const Expr *LHS) {
2265 bool LHSIsTrue = false;
2266 bool LHSIsConst = false;
2267 if (!LHS->isValueDependent())
2268 LHSIsConst = LHS->EvaluateAsBooleanCondition(
2269 LHSIsTrue, CVM.getCodeGenModule().getContext());
2270 return !LHSIsConst || (LHSIsConst && !LHSIsTrue);
2271 }
2272
2273 void VisitBinLOr(const BinaryOperator *E) {
2274 if (isExprInSystemHeader(E)) {
2275 LeafExprSet.insert(E);
2276 return;
2277 }
2278
2279 bool IsRootNode = MCDCBuilder.isIdle();
2280
2281 unsigned SourceRegionsSince = SourceRegions.size();
2282
2283 // Keep track of Binary Operator and assign MCDC condition IDs.
2284 MCDCBuilder.pushAndAssignIDs(E);
2285
2286 extendRegion(E->getLHS());
2287 Counter OutCount = propagateCounts(getRegion().getCounter(), E->getLHS());
2288 handleFileExit(getEnd(E->getLHS()));
2289
2290 // Track LHS True/False Decision.
2291 const auto DecisionLHS = MCDCBuilder.pop();
2292
2293 // Counter tracks the right hand side of a logical or operator.
2294 extendRegion(E->getRHS());
2295 propagateCounts(getRegionCounter(E), E->getRHS());
2296
2297 // Track RHS True/False Decision.
2298 const auto DecisionRHS = MCDCBuilder.back();
2299
2300 // Extract the RHS's Execution Counter.
2301 Counter RHSExecCnt = getRegionCounter(E);
2302
2303 // Extract the RHS's "False" Instance Counter.
2304 Counter RHSFalseCnt = getRegionCounter(E->getRHS());
2305
2306 if (!shouldVisitRHS(E->getLHS())) {
2307 GapRegionCounter = OutCount;
2308 }
2309
2310 // Extract the Parent Region Counter.
2311 Counter ParentCnt = getRegion().getCounter();
2312
2313 // Create Branch Region around LHS condition.
2315 createBranchRegion(E->getLHS(), subtractCounters(ParentCnt, RHSExecCnt),
2316 RHSExecCnt, DecisionLHS);
2317
2318 // Create Branch Region around RHS condition.
2320 createBranchRegion(E->getRHS(), subtractCounters(RHSExecCnt, RHSFalseCnt),
2321 RHSFalseCnt, DecisionRHS);
2322
2323 // Create MCDC Decision Region if at top-level (root).
2324 if (IsRootNode)
2325 createOrCancelDecision(E, SourceRegionsSince);
2326 }
2327
2328 void VisitLambdaExpr(const LambdaExpr *LE) {
2329 // Lambdas are treated as their own functions for now, so we shouldn't
2330 // propagate counts into them.
2331 }
2332
2333 void VisitArrayInitLoopExpr(const ArrayInitLoopExpr *AILE) {
2334 Visit(AILE->getCommonExpr()->getSourceExpr());
2335 }
2336
2337 void VisitPseudoObjectExpr(const PseudoObjectExpr *POE) {
2338 // Just visit syntatic expression as this is what users actually write.
2339 VisitStmt(POE->getSyntacticForm());
2340 }
2341
2342 void VisitOpaqueValueExpr(const OpaqueValueExpr* OVE) {
2343 if (OVE->isUnique())
2344 Visit(OVE->getSourceExpr());
2345 }
2346};
2347
2348} // end anonymous namespace
2349
2350static void dump(llvm::raw_ostream &OS, StringRef FunctionName,
2351 ArrayRef<CounterExpression> Expressions,
2353 OS << FunctionName << ":\n";
2354 CounterMappingContext Ctx(Expressions);
2355 for (const auto &R : Regions) {
2356 OS.indent(2);
2357 switch (R.Kind) {
2358 case CounterMappingRegion::CodeRegion:
2359 break;
2360 case CounterMappingRegion::ExpansionRegion:
2361 OS << "Expansion,";
2362 break;
2363 case CounterMappingRegion::SkippedRegion:
2364 OS << "Skipped,";
2365 break;
2366 case CounterMappingRegion::GapRegion:
2367 OS << "Gap,";
2368 break;
2369 case CounterMappingRegion::BranchRegion:
2370 case CounterMappingRegion::MCDCBranchRegion:
2371 OS << "Branch,";
2372 break;
2373 case CounterMappingRegion::MCDCDecisionRegion:
2374 OS << "Decision,";
2375 break;
2376 }
2377
2378 OS << "File " << R.FileID << ", " << R.LineStart << ":" << R.ColumnStart
2379 << " -> " << R.LineEnd << ":" << R.ColumnEnd << " = ";
2380
2381 if (const auto *DecisionParams =
2382 std::get_if<mcdc::DecisionParameters>(&R.MCDCParams)) {
2383 OS << "M:" << DecisionParams->BitmapIdx;
2384 OS << ", C:" << DecisionParams->NumConditions;
2385 } else {
2386 Ctx.dump(R.Count, OS);
2387
2388 if (R.Kind == CounterMappingRegion::BranchRegion ||
2389 R.Kind == CounterMappingRegion::MCDCBranchRegion) {
2390 OS << ", ";
2391 Ctx.dump(R.FalseCount, OS);
2392 }
2393 }
2394
2395 if (const auto *BranchParams =
2396 std::get_if<mcdc::BranchParameters>(&R.MCDCParams)) {
2397 OS << " [" << BranchParams->ID + 1 << ","
2398 << BranchParams->Conds[true] + 1;
2399 OS << "," << BranchParams->Conds[false] + 1 << "] ";
2400 }
2401
2402 if (R.Kind == CounterMappingRegion::ExpansionRegion)
2403 OS << " (Expanded file = " << R.ExpandedFileID << ")";
2404 OS << "\n";
2405 }
2406}
2407
2409 CodeGenModule &CGM, CoverageSourceInfo &SourceInfo)
2410 : CGM(CGM), SourceInfo(SourceInfo) {}
2411
2412std::string CoverageMappingModuleGen::getCurrentDirname() {
2413 if (!CGM.getCodeGenOpts().CoverageCompilationDir.empty())
2415
2416 SmallString<256> CWD;
2417 llvm::sys::fs::current_path(CWD);
2418 return CWD.str().str();
2419}
2420
2421std::string CoverageMappingModuleGen::normalizeFilename(StringRef Filename) {
2423 llvm::sys::path::remove_dots(Path, /*remove_dot_dot=*/true);
2424
2425 /// Traverse coverage prefix map in reverse order because prefix replacements
2426 /// are applied in reverse order starting from the last one when multiple
2427 /// prefix replacement options are provided.
2428 for (const auto &[From, To] :
2429 llvm::reverse(CGM.getCodeGenOpts().CoveragePrefixMap)) {
2430 if (llvm::sys::path::replace_path_prefix(Path, From, To))
2431 break;
2432 }
2433 return Path.str().str();
2434}
2435
2436static std::string getInstrProfSection(const CodeGenModule &CGM,
2437 llvm::InstrProfSectKind SK) {
2438 return llvm::getInstrProfSectionName(
2439 SK, CGM.getContext().getTargetInfo().getTriple().getObjectFormat());
2440}
2441
2442void CoverageMappingModuleGen::emitFunctionMappingRecord(
2443 const FunctionInfo &Info, uint64_t FilenamesRef) {
2444 llvm::LLVMContext &Ctx = CGM.getLLVMContext();
2445
2446 // Assign a name to the function record. This is used to merge duplicates.
2447 std::string FuncRecordName = "__covrec_" + llvm::utohexstr(Info.NameHash);
2448
2449 // A dummy description for a function included-but-not-used in a TU can be
2450 // replaced by full description provided by a different TU. The two kinds of
2451 // descriptions play distinct roles: therefore, assign them different names
2452 // to prevent `linkonce_odr` merging.
2453 if (Info.IsUsed)
2454 FuncRecordName += "u";
2455
2456 // Create the function record type.
2457 const uint64_t NameHash = Info.NameHash;
2458 const uint64_t FuncHash = Info.FuncHash;
2459 const std::string &CoverageMapping = Info.CoverageMapping;
2460#define COVMAP_FUNC_RECORD(Type, LLVMType, Name, Init) LLVMType,
2461 llvm::Type *FunctionRecordTypes[] = {
2462#include "llvm/ProfileData/InstrProfData.inc"
2463 };
2464 auto *FunctionRecordTy =
2465 llvm::StructType::get(Ctx, ArrayRef(FunctionRecordTypes),
2466 /*isPacked=*/true);
2467
2468 // Create the function record constant.
2469#define COVMAP_FUNC_RECORD(Type, LLVMType, Name, Init) Init,
2470 llvm::Constant *FunctionRecordVals[] = {
2471 #include "llvm/ProfileData/InstrProfData.inc"
2472 };
2473 auto *FuncRecordConstant =
2474 llvm::ConstantStruct::get(FunctionRecordTy, ArrayRef(FunctionRecordVals));
2475
2476 // Create the function record global.
2477 auto *FuncRecord = new llvm::GlobalVariable(
2478 CGM.getModule(), FunctionRecordTy, /*isConstant=*/true,
2479 llvm::GlobalValue::LinkOnceODRLinkage, FuncRecordConstant,
2480 FuncRecordName);
2481 FuncRecord->setVisibility(llvm::GlobalValue::HiddenVisibility);
2482 FuncRecord->setSection(getInstrProfSection(CGM, llvm::IPSK_covfun));
2483 FuncRecord->setAlignment(llvm::Align(8));
2484 if (CGM.supportsCOMDAT())
2485 FuncRecord->setComdat(CGM.getModule().getOrInsertComdat(FuncRecordName));
2486
2487 // Make sure the data doesn't get deleted.
2488 CGM.addUsedGlobal(FuncRecord);
2489}
2490
2492 llvm::GlobalVariable *NamePtr, StringRef NameValue, uint64_t FuncHash,
2493 const std::string &CoverageMapping, bool IsUsed) {
2494 const uint64_t NameHash = llvm::IndexedInstrProf::ComputeHash(NameValue);
2495 FunctionRecords.push_back({NameHash, FuncHash, CoverageMapping, IsUsed});
2496
2497 if (!IsUsed)
2498 FunctionNames.push_back(NamePtr);
2499
2500 if (CGM.getCodeGenOpts().DumpCoverageMapping) {
2501 // Dump the coverage mapping data for this function by decoding the
2502 // encoded data. This allows us to dump the mapping regions which were
2503 // also processed by the CoverageMappingWriter which performs
2504 // additional minimization operations such as reducing the number of
2505 // expressions.
2507 std::vector<StringRef> Filenames;
2508 std::vector<CounterExpression> Expressions;
2509 std::vector<CounterMappingRegion> Regions;
2510 FilenameStrs.resize(FileEntries.size() + 1);
2511 FilenameStrs[0] = normalizeFilename(getCurrentDirname());
2512 for (const auto &Entry : FileEntries) {
2513 auto I = Entry.second;
2514 FilenameStrs[I] = normalizeFilename(Entry.first.getName());
2515 }
2516 ArrayRef<std::string> FilenameRefs = llvm::ArrayRef(FilenameStrs);
2517 RawCoverageMappingReader Reader(CoverageMapping, FilenameRefs, Filenames,
2518 Expressions, Regions);
2519 if (Reader.read())
2520 return;
2521 dump(llvm::outs(), NameValue, Expressions, Regions);
2522 }
2523}
2524
2526 if (FunctionRecords.empty())
2527 return;
2528 llvm::LLVMContext &Ctx = CGM.getLLVMContext();
2529 auto *Int32Ty = llvm::Type::getInt32Ty(Ctx);
2530
2531 // Create the filenames and merge them with coverage mappings
2533 FilenameStrs.resize(FileEntries.size() + 1);
2534 // The first filename is the current working directory.
2535 FilenameStrs[0] = normalizeFilename(getCurrentDirname());
2536 for (const auto &Entry : FileEntries) {
2537 auto I = Entry.second;
2538 FilenameStrs[I] = normalizeFilename(Entry.first.getName());
2539 }
2540
2541 std::string Filenames;
2542 {
2543 llvm::raw_string_ostream OS(Filenames);
2544 CoverageFilenamesSectionWriter(FilenameStrs).write(OS);
2545 }
2546 auto *FilenamesVal =
2547 llvm::ConstantDataArray::getString(Ctx, Filenames, false);
2548 const int64_t FilenamesRef = llvm::IndexedInstrProf::ComputeHash(Filenames);
2549
2550 // Emit the function records.
2551 for (const FunctionInfo &Info : FunctionRecords)
2552 emitFunctionMappingRecord(Info, FilenamesRef);
2553
2554 const unsigned NRecords = 0;
2555 const size_t FilenamesSize = Filenames.size();
2556 const unsigned CoverageMappingSize = 0;
2557 llvm::Type *CovDataHeaderTypes[] = {
2558#define COVMAP_HEADER(Type, LLVMType, Name, Init) LLVMType,
2559#include "llvm/ProfileData/InstrProfData.inc"
2560 };
2561 auto CovDataHeaderTy =
2562 llvm::StructType::get(Ctx, ArrayRef(CovDataHeaderTypes));
2563 llvm::Constant *CovDataHeaderVals[] = {
2564#define COVMAP_HEADER(Type, LLVMType, Name, Init) Init,
2565#include "llvm/ProfileData/InstrProfData.inc"
2566 };
2567 auto CovDataHeaderVal =
2568 llvm::ConstantStruct::get(CovDataHeaderTy, ArrayRef(CovDataHeaderVals));
2569
2570 // Create the coverage data record
2571 llvm::Type *CovDataTypes[] = {CovDataHeaderTy, FilenamesVal->getType()};
2572 auto CovDataTy = llvm::StructType::get(Ctx, ArrayRef(CovDataTypes));
2573 llvm::Constant *TUDataVals[] = {CovDataHeaderVal, FilenamesVal};
2574 auto CovDataVal = llvm::ConstantStruct::get(CovDataTy, ArrayRef(TUDataVals));
2575 auto CovData = new llvm::GlobalVariable(
2576 CGM.getModule(), CovDataTy, true, llvm::GlobalValue::PrivateLinkage,
2577 CovDataVal, llvm::getCoverageMappingVarName());
2578
2579 CovData->setSection(getInstrProfSection(CGM, llvm::IPSK_covmap));
2580 CovData->setAlignment(llvm::Align(8));
2581
2582 // Make sure the data doesn't get deleted.
2583 CGM.addUsedGlobal(CovData);
2584 // Create the deferred function records array
2585 if (!FunctionNames.empty()) {
2586 auto NamesArrTy = llvm::ArrayType::get(llvm::PointerType::getUnqual(Ctx),
2587 FunctionNames.size());
2588 auto NamesArrVal = llvm::ConstantArray::get(NamesArrTy, FunctionNames);
2589 // This variable will *NOT* be emitted to the object file. It is used
2590 // to pass the list of names referenced to codegen.
2591 new llvm::GlobalVariable(CGM.getModule(), NamesArrTy, true,
2592 llvm::GlobalValue::InternalLinkage, NamesArrVal,
2593 llvm::getCoverageUnusedNamesVarName());
2594 }
2595}
2596
2598 auto It = FileEntries.find(File);
2599 if (It != FileEntries.end())
2600 return It->second;
2601 unsigned FileID = FileEntries.size() + 1;
2602 FileEntries.insert(std::make_pair(File, FileID));
2603 return FileID;
2604}
2605
2607 llvm::raw_ostream &OS) {
2608 assert(CounterMap && MCDCState);
2609 CounterCoverageMappingBuilder Walker(CVM, *CounterMap, *MCDCState, SM,
2610 LangOpts);
2611 Walker.VisitDecl(D);
2612 Walker.write(OS);
2613}
2614
2616 llvm::raw_ostream &OS) {
2617 EmptyCoverageMappingBuilder Walker(CVM, SM, LangOpts);
2618 Walker.VisitDecl(D);
2619 Walker.write(OS);
2620}
NodeId Parent
Definition: ASTDiff.cpp:191
static char ID
Definition: Arena.cpp:183
#define SM(sm)
Definition: Cuda.cpp:83
Defines the Diagnostic-related interfaces.
static const MemRegion * getRegion(const CallEvent &Call, const MutexDescriptor &Descriptor, bool IsLock)
const Decl * D
IndirectLocalPath & Path
Expr * E
static std::string getInstrProfSection(const CodeGenModule &CGM, llvm::InstrProfSectKind SK)
static void dump(llvm::raw_ostream &OS, StringRef FunctionName, ArrayRef< CounterExpression > Expressions, ArrayRef< CounterMappingRegion > Regions)
static llvm::cl::opt< bool > EmptyLineCommentCoverage("emptyline-comment-coverage", llvm::cl::desc("Emit emptylines and comment lines as skipped regions (only " "disable it on test)"), llvm::cl::init(true), llvm::cl::Hidden)
Defines the clang::FileManager interface and associated types.
StringRef Filename
Definition: Format.cpp:3001
llvm::DenseSet< const void * > Visited
Definition: HTMLLogger.cpp:146
static DiagnosticBuilder Diag(DiagnosticsEngine *Diags, const LangOptions &Features, FullSourceLoc TokLoc, const char *TokBegin, const char *TokRangeBegin, const char *TokRangeEnd, unsigned DiagID)
Produce a diagnostic highlighting some portion of a literal.
SourceRange Range
Definition: SemaObjC.cpp:758
SourceLocation Loc
Definition: SemaObjC.cpp:759
const TargetInfo & getTargetInfo() const
Definition: ASTContext.h:779
AbstractConditionalOperator - An abstract base class for ConditionalOperator and BinaryConditionalOpe...
Definition: Expr.h:4175
Represents a loop initializing the elements of an array.
Definition: Expr.h:5703
OpaqueValueExpr * getCommonExpr() const
Get the common subexpression shared by all initializations (the source array).
Definition: Expr.h:5718
A builtin binary operation expression such as "x + y" or "x <= y".
Definition: Expr.h:3860
BreakStmt - This represents a break.
Definition: Stmt.h:2990
CXXCatchStmt - This represents a C++ catch block.
Definition: StmtCXX.h:28
CXXForRangeStmt - This represents C++0x [stmt.ranged]'s ranged for statement, represented as 'for (ra...
Definition: StmtCXX.h:135
A C++ throw-expression (C++ [except.throw]).
Definition: ExprCXX.h:1206
CXXTryStmt - A C++ try block, including all handlers.
Definition: StmtCXX.h:69
CallExpr - Represents a function call (C99 6.5.2.2, C++ [expr.call]).
Definition: Expr.h:2830
llvm::SmallVector< std::pair< std::string, std::string >, 0 > CoveragePrefixMap
Prefix replacement map for source-based code coverage to remap source file paths in coverage mapping.
std::string CoverageCompilationDir
The string to embed in coverage mapping as the current working directory.
This class organizes the cross-function state that is used while generating LLVM code.
llvm::Module & getModule() const
DiagnosticsEngine & getDiags() const
void addUsedGlobal(llvm::GlobalValue *GV)
Add a global to a list to be added to the llvm.used metadata.
ASTContext & getContext() const
const CodeGenOptions & getCodeGenOpts() const
llvm::LLVMContext & getLLVMContext()
void emitEmptyMapping(const Decl *D, llvm::raw_ostream &OS)
Emit the coverage mapping data for an unused function.
void emitCounterMapping(const Decl *D, llvm::raw_ostream &OS)
Emit the coverage mapping data which maps the regions of code to counters that will be used to find t...
Organizes the cross-function state that is used while generating code coverage mapping data.
void addFunctionMappingRecord(llvm::GlobalVariable *FunctionName, StringRef FunctionNameValue, uint64_t FunctionHash, const std::string &CoverageMapping, bool IsUsed=true)
Add a function's coverage mapping record to the collection of the function mapping records.
CoverageSourceInfo & getSourceInfo() const
static CoverageSourceInfo * setUpCoverageCallbacks(Preprocessor &PP)
CoverageMappingModuleGen(CodeGenModule &CGM, CoverageSourceInfo &SourceInfo)
void emit()
Emit the coverage mapping data for a translation unit.
CodeGenModule & getCodeGenModule()
Return an interface into CodeGenModule.
unsigned getFileID(FileEntryRef File)
Return the coverage mapping translation unit file id for the given file.
ConstStmtVisitor - This class implements a simple visitor for Stmt subclasses.
Definition: StmtVisitor.h:195
ContinueStmt - This represents a continue.
Definition: Stmt.h:2960
Represents a 'co_return' statement in the C++ Coroutines TS.
Definition: StmtCXX.h:473
Represents the body of a coroutine.
Definition: StmtCXX.h:320
Represents an expression that might suspend coroutine execution; either a co_await or co_yield expres...
Definition: ExprCXX.h:5071
Stores additional source code information like skipped ranges which is required by the coverage mappi...
void SourceRangeSkipped(SourceRange Range, SourceLocation EndifLoc) override
Hook called when a source range is skipped.
void updateNextTokLoc(SourceLocation Loc)
void AddSkippedRange(SourceRange Range, SkippedRange::Kind RangeKind)
std::vector< SkippedRange > & getSkippedRanges()
bool HandleComment(Preprocessor &PP, SourceRange Range) override
void HandleEmptyline(SourceRange Range) override
Decl - This represents one declaration (or definition), e.g.
Definition: DeclBase.h:86
virtual Stmt * getBody() const
getBody - If this Decl represents a declaration for a body of code, such as a function or method defi...
Definition: DeclBase.h:1077
virtual bool hasBody() const
Returns true if this Decl represents a declaration for a body of code, such as a function or method d...
Definition: DeclBase.h:1083
DoStmt - This represents a 'do/while' stmt.
Definition: Stmt.h:2735
This represents one expression.
Definition: Expr.h:110
bool EvaluateAsInt(EvalResult &Result, const ASTContext &Ctx, SideEffectsKind AllowSideEffects=SE_NoSideEffects, bool InConstantContext=false) const
EvaluateAsInt - Return true if this is a constant which we can fold and convert to an integer,...
bool isValueDependent() const
Determines whether the value of this expression depends on.
Definition: Expr.h:175
bool EvaluateAsBooleanCondition(bool &Result, const ASTContext &Ctx, bool InConstantContext=false) const
EvaluateAsBooleanCondition - Return true if this is a constant which we can fold and convert to a boo...
QualType getType() const
Definition: Expr.h:142
A reference to a FileEntry that includes the name of the file as it was accessed by the FileManager's...
Definition: FileEntry.h:57
An opaque identifier used by SourceManager which refers to a source file (MemoryBuffer) along with it...
ForStmt - This represents a 'for (init;cond;inc)' stmt.
Definition: Stmt.h:2791
bool getNoReturn() const
Definition: Type.h:4467
GotoStmt - This represents a direct goto.
Definition: Stmt.h:2872
IfStmt - This represents an if/then/else.
Definition: Stmt.h:2148
LabelStmt - Represents a label, which has a substatement.
Definition: Stmt.h:2041
A C++ lambda expression, which produces a function object (of unspecified type) that can be invoked l...
Definition: ExprCXX.h:1954
Keeps track of the various options that can be enabled, which controls the dialect of C or C++ that i...
Definition: LangOptions.h:476
static unsigned MeasureTokenLength(SourceLocation Loc, const SourceManager &SM, const LangOptions &LangOpts)
MeasureTokenLength - Relex the token at the specified location and return its length in bytes in the ...
Definition: Lexer.cpp:499
Represents Objective-C's collection statement.
Definition: StmtObjC.h:23
OpaqueValueExpr - An expression referring to an opaque object of a fixed type and value class.
Definition: Expr.h:1173
Expr * getSourceExpr() const
The source expression of an opaque value expression is the expression which originally generated the ...
Definition: Expr.h:1223
bool isUnique() const
Definition: Expr.h:1231
Engages in a tight little dance with the lexer to efficiently preprocess tokens.
Definition: Preprocessor.h:137
void addCommentHandler(CommentHandler *Handler)
Add the specified comment handler to the preprocessor.
void addPPCallbacks(std::unique_ptr< PPCallbacks > C)
SourceManager & getSourceManager() const
void setPreprocessToken(bool Preprocess)
void setTokenWatcher(llvm::unique_function< void(const clang::Token &)> F)
Register a function that would be called on each token in the final expanded token stream.
void setEmptylineHandler(EmptylineHandler *Handler)
Set empty line handler.
PseudoObjectExpr - An expression which accesses a pseudo-object l-value.
Definition: Expr.h:6497
Expr * getSyntacticForm()
Return the syntactic form of this expression, i.e.
Definition: Expr.h:6539
A (possibly-)qualified type.
Definition: Type.h:941
ReturnStmt - This represents a return, optionally of an expression: return; return 4;.
Definition: Stmt.h:3029
Encodes a location in the source.
bool isValid() const
Return true if this is a valid SourceLocation object.
SourceLocation getLocWithOffset(IntTy Offset) const
Return a source location with the specified offset from this SourceLocation.
This class handles loading and caching of source files into memory.
A trivial tuple used to represent a source range.
SourceLocation getEnd() const
SourceLocation getBegin() const
Each ExpansionInfo encodes the expansion location - where the token was ultimately expanded,...
SourceLocation getExpansionLocStart() const
bool isFunctionMacroExpansion() const
SourceLocation getExpansionLocEnd() const
Stmt - This represents one statement.
Definition: Stmt.h:84
SourceLocation getEndLoc() const LLVM_READONLY
Definition: Stmt.cpp:350
SourceLocation getBeginLoc() const LLVM_READONLY
Definition: Stmt.cpp:338
SourceLocation getColonLoc() const
Definition: Stmt.h:1790
const SwitchCase * getNextSwitchCase() const
Definition: Stmt.h:1784
SwitchStmt - This represents a 'switch' stmt.
Definition: Stmt.h:2398
const llvm::Triple & getTriple() const
Returns the target triple of the primary target.
Definition: TargetInfo.h:1256
Token - This structure provides full information about a lexed token.
Definition: Token.h:36
SourceLocation getLocation() const
Return a source location identifier for the specified offset in the current file.
Definition: Token.h:132
tok::TokenKind getKind() const
Definition: Token.h:94
WhileStmt - This represents a 'while' stmt.
Definition: Stmt.h:2594
llvm::cl::opt< std::string > Filter
The JSON file list parser is used to communicate input to InstallAPI.
FunctionType::ExtInfo getFunctionExtInfo(const Type &t)
Definition: Type.h:7903
unsigned long uint64_t
cl::opt< bool > SystemHeadersCoverage
Diagnostic wrappers for TextAPI types for error reporting.
Definition: Dominators.h:30
cl::opt< bool > EnableSingleByteCoverage
#define false
Definition: stdbool.h:26
Per-Function MC/DC state.
Definition: MCDCState.h:29
llvm::DenseMap< const Stmt *, Branch > BranchByStmt
Definition: MCDCState.h:44
llvm::DenseMap< const Stmt *, Decision > DecisionByStmt
Definition: MCDCState.h:37
EvalResult is a struct with detailed info about an evaluated expression.
Definition: Expr.h:642