1204643Srdivacky//=- ReachableCodePathInsensitive.cpp ---------------------------*- C++ --*-==//
2204643Srdivacky//
3204643Srdivacky//                     The LLVM Compiler Infrastructure
4204643Srdivacky//
5204643Srdivacky// This file is distributed under the University of Illinois Open Source
6204643Srdivacky// License. See LICENSE.TXT for details.
7204643Srdivacky//
8204643Srdivacky//===----------------------------------------------------------------------===//
9204643Srdivacky//
10204643Srdivacky// This file implements a flow-sensitive, path-insensitive analysis of
11204643Srdivacky// determining reachable blocks within a CFG.
12204643Srdivacky//
13204643Srdivacky//===----------------------------------------------------------------------===//
14204643Srdivacky
15249423Sdim#include "clang/Analysis/Analyses/ReachableCode.h"
16204643Srdivacky#include "clang/AST/Expr.h"
17204643Srdivacky#include "clang/AST/ExprCXX.h"
18224145Sdim#include "clang/AST/ExprObjC.h"
19204643Srdivacky#include "clang/AST/StmtCXX.h"
20249423Sdim#include "clang/Analysis/AnalysisContext.h"
21204643Srdivacky#include "clang/Analysis/CFG.h"
22204643Srdivacky#include "clang/Basic/SourceManager.h"
23249423Sdim#include "llvm/ADT/BitVector.h"
24249423Sdim#include "llvm/ADT/SmallVector.h"
25204643Srdivacky
26204643Srdivackyusing namespace clang;
27204643Srdivacky
28226633Sdimnamespace {
29226633Sdimclass DeadCodeScan {
30226633Sdim  llvm::BitVector Visited;
31226633Sdim  llvm::BitVector &Reachable;
32249423Sdim  SmallVector<const CFGBlock *, 10> WorkList;
33226633Sdim
34249423Sdim  typedef SmallVector<std::pair<const CFGBlock *, const Stmt *>, 12>
35226633Sdim      DeferredLocsTy;
36226633Sdim
37226633Sdim  DeferredLocsTy DeferredLocs;
38226633Sdim
39226633Sdimpublic:
40226633Sdim  DeadCodeScan(llvm::BitVector &reachable)
41226633Sdim    : Visited(reachable.size()),
42226633Sdim      Reachable(reachable) {}
43226633Sdim
44226633Sdim  void enqueue(const CFGBlock *block);
45226633Sdim  unsigned scanBackwards(const CFGBlock *Start,
46226633Sdim                         clang::reachable_code::Callback &CB);
47226633Sdim
48226633Sdim  bool isDeadCodeRoot(const CFGBlock *Block);
49226633Sdim
50226633Sdim  const Stmt *findDeadCode(const CFGBlock *Block);
51226633Sdim
52226633Sdim  void reportDeadCode(const Stmt *S,
53226633Sdim                      clang::reachable_code::Callback &CB);
54226633Sdim};
55226633Sdim}
56226633Sdim
57226633Sdimvoid DeadCodeScan::enqueue(const CFGBlock *block) {
58226633Sdim  unsigned blockID = block->getBlockID();
59226633Sdim  if (Reachable[blockID] || Visited[blockID])
60226633Sdim    return;
61226633Sdim  Visited[blockID] = true;
62226633Sdim  WorkList.push_back(block);
63226633Sdim}
64226633Sdim
65226633Sdimbool DeadCodeScan::isDeadCodeRoot(const clang::CFGBlock *Block) {
66226633Sdim  bool isDeadRoot = true;
67226633Sdim
68226633Sdim  for (CFGBlock::const_pred_iterator I = Block->pred_begin(),
69226633Sdim        E = Block->pred_end(); I != E; ++I) {
70226633Sdim    if (const CFGBlock *PredBlock = *I) {
71226633Sdim      unsigned blockID = PredBlock->getBlockID();
72226633Sdim      if (Visited[blockID]) {
73226633Sdim        isDeadRoot = false;
74226633Sdim        continue;
75226633Sdim      }
76226633Sdim      if (!Reachable[blockID]) {
77226633Sdim        isDeadRoot = false;
78226633Sdim        Visited[blockID] = true;
79226633Sdim        WorkList.push_back(PredBlock);
80226633Sdim        continue;
81226633Sdim      }
82226633Sdim    }
83226633Sdim  }
84226633Sdim
85226633Sdim  return isDeadRoot;
86226633Sdim}
87226633Sdim
88226633Sdimstatic bool isValidDeadStmt(const Stmt *S) {
89226633Sdim  if (S->getLocStart().isInvalid())
90226633Sdim    return false;
91226633Sdim  if (const BinaryOperator *BO = dyn_cast<BinaryOperator>(S))
92226633Sdim    return BO->getOpcode() != BO_Comma;
93226633Sdim  return true;
94226633Sdim}
95226633Sdim
96226633Sdimconst Stmt *DeadCodeScan::findDeadCode(const clang::CFGBlock *Block) {
97226633Sdim  for (CFGBlock::const_iterator I = Block->begin(), E = Block->end(); I!=E; ++I)
98249423Sdim    if (Optional<CFGStmt> CS = I->getAs<CFGStmt>()) {
99226633Sdim      const Stmt *S = CS->getStmt();
100226633Sdim      if (isValidDeadStmt(S))
101226633Sdim        return S;
102226633Sdim    }
103226633Sdim
104226633Sdim  if (CFGTerminator T = Block->getTerminator()) {
105226633Sdim    const Stmt *S = T.getStmt();
106226633Sdim    if (isValidDeadStmt(S))
107226633Sdim      return S;
108226633Sdim  }
109226633Sdim
110226633Sdim  return 0;
111226633Sdim}
112226633Sdim
113263508Sdimstatic int SrcCmp(const std::pair<const CFGBlock *, const Stmt *> *p1,
114263508Sdim                  const std::pair<const CFGBlock *, const Stmt *> *p2) {
115263508Sdim  if (p1->second->getLocStart() < p2->second->getLocStart())
116263508Sdim    return -1;
117263508Sdim  if (p2->second->getLocStart() < p1->second->getLocStart())
118263508Sdim    return 1;
119263508Sdim  return 0;
120226633Sdim}
121226633Sdim
122226633Sdimunsigned DeadCodeScan::scanBackwards(const clang::CFGBlock *Start,
123226633Sdim                                     clang::reachable_code::Callback &CB) {
124226633Sdim
125226633Sdim  unsigned count = 0;
126226633Sdim  enqueue(Start);
127226633Sdim
128226633Sdim  while (!WorkList.empty()) {
129226633Sdim    const CFGBlock *Block = WorkList.pop_back_val();
130226633Sdim
131226633Sdim    // It is possible that this block has been marked reachable after
132226633Sdim    // it was enqueued.
133226633Sdim    if (Reachable[Block->getBlockID()])
134226633Sdim      continue;
135226633Sdim
136226633Sdim    // Look for any dead code within the block.
137226633Sdim    const Stmt *S = findDeadCode(Block);
138226633Sdim
139226633Sdim    if (!S) {
140226633Sdim      // No dead code.  Possibly an empty block.  Look at dead predecessors.
141226633Sdim      for (CFGBlock::const_pred_iterator I = Block->pred_begin(),
142226633Sdim           E = Block->pred_end(); I != E; ++I) {
143226633Sdim        if (const CFGBlock *predBlock = *I)
144226633Sdim          enqueue(predBlock);
145226633Sdim      }
146226633Sdim      continue;
147226633Sdim    }
148226633Sdim
149226633Sdim    // Specially handle macro-expanded code.
150226633Sdim    if (S->getLocStart().isMacroID()) {
151226633Sdim      count += clang::reachable_code::ScanReachableFromBlock(Block, Reachable);
152226633Sdim      continue;
153226633Sdim    }
154226633Sdim
155226633Sdim    if (isDeadCodeRoot(Block)) {
156226633Sdim      reportDeadCode(S, CB);
157226633Sdim      count += clang::reachable_code::ScanReachableFromBlock(Block, Reachable);
158226633Sdim    }
159226633Sdim    else {
160226633Sdim      // Record this statement as the possibly best location in a
161226633Sdim      // strongly-connected component of dead code for emitting a
162226633Sdim      // warning.
163226633Sdim      DeferredLocs.push_back(std::make_pair(Block, S));
164226633Sdim    }
165226633Sdim  }
166226633Sdim
167226633Sdim  // If we didn't find a dead root, then report the dead code with the
168226633Sdim  // earliest location.
169226633Sdim  if (!DeferredLocs.empty()) {
170226633Sdim    llvm::array_pod_sort(DeferredLocs.begin(), DeferredLocs.end(), SrcCmp);
171226633Sdim    for (DeferredLocsTy::iterator I = DeferredLocs.begin(),
172226633Sdim          E = DeferredLocs.end(); I != E; ++I) {
173226633Sdim      const CFGBlock *block = I->first;
174226633Sdim      if (Reachable[block->getBlockID()])
175226633Sdim        continue;
176226633Sdim      reportDeadCode(I->second, CB);
177226633Sdim      count += clang::reachable_code::ScanReachableFromBlock(block, Reachable);
178226633Sdim    }
179226633Sdim  }
180226633Sdim
181226633Sdim  return count;
182226633Sdim}
183226633Sdim
184226633Sdimstatic SourceLocation GetUnreachableLoc(const Stmt *S,
185226633Sdim                                        SourceRange &R1,
186204643Srdivacky                                        SourceRange &R2) {
187204643Srdivacky  R1 = R2 = SourceRange();
188204643Srdivacky
189218893Sdim  if (const Expr *Ex = dyn_cast<Expr>(S))
190218893Sdim    S = Ex->IgnoreParenImpCasts();
191218893Sdim
192204643Srdivacky  switch (S->getStmtClass()) {
193204643Srdivacky    case Expr::BinaryOperatorClass: {
194204643Srdivacky      const BinaryOperator *BO = cast<BinaryOperator>(S);
195204643Srdivacky      return BO->getOperatorLoc();
196204643Srdivacky    }
197204643Srdivacky    case Expr::UnaryOperatorClass: {
198204643Srdivacky      const UnaryOperator *UO = cast<UnaryOperator>(S);
199204643Srdivacky      R1 = UO->getSubExpr()->getSourceRange();
200204643Srdivacky      return UO->getOperatorLoc();
201204643Srdivacky    }
202204643Srdivacky    case Expr::CompoundAssignOperatorClass: {
203204643Srdivacky      const CompoundAssignOperator *CAO = cast<CompoundAssignOperator>(S);
204204643Srdivacky      R1 = CAO->getLHS()->getSourceRange();
205204643Srdivacky      R2 = CAO->getRHS()->getSourceRange();
206204643Srdivacky      return CAO->getOperatorLoc();
207204643Srdivacky    }
208218893Sdim    case Expr::BinaryConditionalOperatorClass:
209204643Srdivacky    case Expr::ConditionalOperatorClass: {
210218893Sdim      const AbstractConditionalOperator *CO =
211218893Sdim        cast<AbstractConditionalOperator>(S);
212204643Srdivacky      return CO->getQuestionLoc();
213204643Srdivacky    }
214204643Srdivacky    case Expr::MemberExprClass: {
215204643Srdivacky      const MemberExpr *ME = cast<MemberExpr>(S);
216204643Srdivacky      R1 = ME->getSourceRange();
217204643Srdivacky      return ME->getMemberLoc();
218204643Srdivacky    }
219204643Srdivacky    case Expr::ArraySubscriptExprClass: {
220204643Srdivacky      const ArraySubscriptExpr *ASE = cast<ArraySubscriptExpr>(S);
221204643Srdivacky      R1 = ASE->getLHS()->getSourceRange();
222204643Srdivacky      R2 = ASE->getRHS()->getSourceRange();
223204643Srdivacky      return ASE->getRBracketLoc();
224204643Srdivacky    }
225204643Srdivacky    case Expr::CStyleCastExprClass: {
226204643Srdivacky      const CStyleCastExpr *CSC = cast<CStyleCastExpr>(S);
227204643Srdivacky      R1 = CSC->getSubExpr()->getSourceRange();
228204643Srdivacky      return CSC->getLParenLoc();
229204643Srdivacky    }
230204643Srdivacky    case Expr::CXXFunctionalCastExprClass: {
231204643Srdivacky      const CXXFunctionalCastExpr *CE = cast <CXXFunctionalCastExpr>(S);
232204643Srdivacky      R1 = CE->getSubExpr()->getSourceRange();
233263508Sdim      return CE->getLocStart();
234204643Srdivacky    }
235204643Srdivacky    case Stmt::CXXTryStmtClass: {
236204643Srdivacky      return cast<CXXTryStmt>(S)->getHandler(0)->getCatchLoc();
237204643Srdivacky    }
238224145Sdim    case Expr::ObjCBridgedCastExprClass: {
239224145Sdim      const ObjCBridgedCastExpr *CSC = cast<ObjCBridgedCastExpr>(S);
240224145Sdim      R1 = CSC->getSubExpr()->getSourceRange();
241224145Sdim      return CSC->getLParenLoc();
242224145Sdim    }
243204643Srdivacky    default: ;
244204643Srdivacky  }
245204643Srdivacky  R1 = S->getSourceRange();
246204643Srdivacky  return S->getLocStart();
247204643Srdivacky}
248204643Srdivacky
249226633Sdimvoid DeadCodeScan::reportDeadCode(const Stmt *S,
250226633Sdim                                  clang::reachable_code::Callback &CB) {
251204643Srdivacky  SourceRange R1, R2;
252226633Sdim  SourceLocation Loc = GetUnreachableLoc(S, R1, R2);
253226633Sdim  CB.HandleUnreachable(Loc, R1, R2);
254204643Srdivacky}
255204643Srdivacky
256204643Srdivackynamespace clang { namespace reachable_code {
257234353Sdim
258234353Sdimvoid Callback::anchor() { }
259234353Sdim
260226633Sdimunsigned ScanReachableFromBlock(const CFGBlock *Start,
261204643Srdivacky                                llvm::BitVector &Reachable) {
262204643Srdivacky  unsigned count = 0;
263226633Sdim
264221345Sdim  // Prep work queue
265226633Sdim  SmallVector<const CFGBlock*, 32> WL;
266226633Sdim
267226633Sdim  // The entry block may have already been marked reachable
268226633Sdim  // by the caller.
269226633Sdim  if (!Reachable[Start->getBlockID()]) {
270226633Sdim    ++count;
271226633Sdim    Reachable[Start->getBlockID()] = true;
272226633Sdim  }
273226633Sdim
274226633Sdim  WL.push_back(Start);
275226633Sdim
276218893Sdim  // Find the reachable blocks from 'Start'.
277204643Srdivacky  while (!WL.empty()) {
278226633Sdim    const CFGBlock *item = WL.pop_back_val();
279226633Sdim
280226633Sdim    // Look at the successors and mark then reachable.
281226633Sdim    for (CFGBlock::const_succ_iterator I = item->succ_begin(),
282226633Sdim         E = item->succ_end(); I != E; ++I)
283204643Srdivacky      if (const CFGBlock *B = *I) {
284204643Srdivacky        unsigned blockID = B->getBlockID();
285204643Srdivacky        if (!Reachable[blockID]) {
286204643Srdivacky          Reachable.set(blockID);
287226633Sdim          WL.push_back(B);
288204643Srdivacky          ++count;
289204643Srdivacky        }
290204643Srdivacky      }
291204643Srdivacky  }
292204643Srdivacky  return count;
293204643Srdivacky}
294226633Sdim
295234353Sdimvoid FindUnreachableCode(AnalysisDeclContext &AC, Callback &CB) {
296204643Srdivacky  CFG *cfg = AC.getCFG();
297204643Srdivacky  if (!cfg)
298204643Srdivacky    return;
299204643Srdivacky
300226633Sdim  // Scan for reachable blocks from the entrance of the CFG.
301226633Sdim  // If there are no unreachable blocks, we're done.
302204643Srdivacky  llvm::BitVector reachable(cfg->getNumBlockIDs());
303226633Sdim  unsigned numReachable = ScanReachableFromBlock(&cfg->getEntry(), reachable);
304204643Srdivacky  if (numReachable == cfg->getNumBlockIDs())
305204643Srdivacky    return;
306226633Sdim
307226633Sdim  // If there aren't explicit EH edges, we should include the 'try' dispatch
308226633Sdim  // blocks as roots.
309226633Sdim  if (!AC.getCFGBuildOptions().AddEHEdges) {
310226633Sdim    for (CFG::try_block_iterator I = cfg->try_blocks_begin(),
311226633Sdim         E = cfg->try_blocks_end() ; I != E; ++I) {
312226633Sdim      numReachable += ScanReachableFromBlock(*I, reachable);
313204643Srdivacky    }
314226633Sdim    if (numReachable == cfg->getNumBlockIDs())
315226633Sdim      return;
316204643Srdivacky  }
317204643Srdivacky
318226633Sdim  // There are some unreachable blocks.  We need to find the root blocks that
319226633Sdim  // contain code that should be considered unreachable.
320226633Sdim  for (CFG::iterator I = cfg->begin(), E = cfg->end(); I != E; ++I) {
321226633Sdim    const CFGBlock *block = *I;
322226633Sdim    // A block may have been marked reachable during this loop.
323226633Sdim    if (reachable[block->getBlockID()])
324226633Sdim      continue;
325226633Sdim
326226633Sdim    DeadCodeScan DS(reachable);
327226633Sdim    numReachable += DS.scanBackwards(block, CB);
328226633Sdim
329226633Sdim    if (numReachable == cfg->getNumBlockIDs())
330226633Sdim      return;
331204643Srdivacky  }
332204643Srdivacky}
333204643Srdivacky
334204643Srdivacky}} // end namespace clang::reachable_code
335