//===--- PlistDiagnostics.cpp - Plist Diagnostics for Paths -----*- C++ -*-===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file defines the PlistDiagnostics object. // //===----------------------------------------------------------------------===// #include "clang/StaticAnalyzer/Core/PathDiagnosticConsumers.h" #include "clang/StaticAnalyzer/Core/BugReporter/PathDiagnostic.h" #include "clang/Basic/SourceManager.h" #include "clang/Basic/FileManager.h" #include "clang/Lex/Preprocessor.h" #include "llvm/Support/raw_ostream.h" #include "llvm/Support/Casting.h" #include "llvm/ADT/DenseMap.h" #include "llvm/ADT/SmallVector.h" using namespace clang; using namespace ento; typedef llvm::DenseMap FIDMap; namespace { struct CompareDiagnostics { // Compare if 'X' is "<" than 'Y'. bool operator()(const PathDiagnostic *X, const PathDiagnostic *Y) const { // First compare by location const FullSourceLoc &XLoc = X->getLocation().asLocation(); const FullSourceLoc &YLoc = Y->getLocation().asLocation(); if (XLoc < YLoc) return true; if (XLoc != YLoc) return false; // Next, compare by bug type. StringRef XBugType = X->getBugType(); StringRef YBugType = Y->getBugType(); if (XBugType < YBugType) return true; if (XBugType != YBugType) return false; // Next, compare by bug description. StringRef XDesc = X->getDescription(); StringRef YDesc = Y->getDescription(); if (XDesc < YDesc) return true; if (XDesc != YDesc) return false; // FIXME: Further refine by comparing PathDiagnosticPieces? return false; } }; } namespace { class PlistDiagnostics : public PathDiagnosticConsumer { std::vector BatchedDiags; const std::string OutputFile; const LangOptions &LangOpts; llvm::OwningPtr SubPD; bool flushed; public: PlistDiagnostics(const std::string& prefix, const LangOptions &LangOpts, PathDiagnosticConsumer *subPD); ~PlistDiagnostics() { FlushDiagnostics(NULL); } void FlushDiagnostics(SmallVectorImpl *FilesMade); void HandlePathDiagnosticImpl(const PathDiagnostic* D); virtual StringRef getName() const { return "PlistDiagnostics"; } PathGenerationScheme getGenerationScheme() const; bool supportsLogicalOpControlFlow() const { return true; } bool supportsAllBlockEdges() const { return true; } virtual bool useVerboseDescription() const { return false; } }; } // end anonymous namespace PlistDiagnostics::PlistDiagnostics(const std::string& output, const LangOptions &LO, PathDiagnosticConsumer *subPD) : OutputFile(output), LangOpts(LO), SubPD(subPD), flushed(false) {} PathDiagnosticConsumer* ento::createPlistDiagnosticConsumer(const std::string& s, const Preprocessor &PP, PathDiagnosticConsumer *subPD) { return new PlistDiagnostics(s, PP.getLangOptions(), subPD); } PathDiagnosticConsumer::PathGenerationScheme PlistDiagnostics::getGenerationScheme() const { if (const PathDiagnosticConsumer *PD = SubPD.get()) return PD->getGenerationScheme(); return Extensive; } static void AddFID(FIDMap &FIDs, SmallVectorImpl &V, const SourceManager* SM, SourceLocation L) { FileID FID = SM->getFileID(SM->getExpansionLoc(L)); FIDMap::iterator I = FIDs.find(FID); if (I != FIDs.end()) return; FIDs[FID] = V.size(); V.push_back(FID); } static unsigned GetFID(const FIDMap& FIDs, const SourceManager &SM, SourceLocation L) { FileID FID = SM.getFileID(SM.getExpansionLoc(L)); FIDMap::const_iterator I = FIDs.find(FID); assert(I != FIDs.end()); return I->second; } static raw_ostream &Indent(raw_ostream &o, const unsigned indent) { for (unsigned i = 0; i < indent; ++i) o << ' '; return o; } static void EmitLocation(raw_ostream &o, const SourceManager &SM, const LangOptions &LangOpts, SourceLocation L, const FIDMap &FM, unsigned indent, bool extend = false) { FullSourceLoc Loc(SM.getExpansionLoc(L), const_cast(SM)); // Add in the length of the token, so that we cover multi-char tokens. unsigned offset = extend ? Lexer::MeasureTokenLength(Loc, SM, LangOpts) - 1 : 0; Indent(o, indent) << "\n"; Indent(o, indent) << " line" << Loc.getExpansionLineNumber() << "\n"; Indent(o, indent) << " col" << Loc.getExpansionColumnNumber() + offset << "\n"; Indent(o, indent) << " file" << GetFID(FM, SM, Loc) << "\n"; Indent(o, indent) << "\n"; } static void EmitLocation(raw_ostream &o, const SourceManager &SM, const LangOptions &LangOpts, const PathDiagnosticLocation &L, const FIDMap& FM, unsigned indent, bool extend = false) { EmitLocation(o, SM, LangOpts, L.asLocation(), FM, indent, extend); } static void EmitRange(raw_ostream &o, const SourceManager &SM, const LangOptions &LangOpts, PathDiagnosticRange R, const FIDMap &FM, unsigned indent) { Indent(o, indent) << "\n"; EmitLocation(o, SM, LangOpts, R.getBegin(), FM, indent+1); EmitLocation(o, SM, LangOpts, R.getEnd(), FM, indent+1, !R.isPoint); Indent(o, indent) << "\n"; } static raw_ostream &EmitString(raw_ostream &o, const std::string& s) { o << ""; for (std::string::const_iterator I=s.begin(), E=s.end(); I!=E; ++I) { char c = *I; switch (c) { default: o << c; break; case '&': o << "&"; break; case '<': o << "<"; break; case '>': o << ">"; break; case '\'': o << "'"; break; case '\"': o << """; break; } } o << ""; return o; } static void ReportControlFlow(raw_ostream &o, const PathDiagnosticControlFlowPiece& P, const FIDMap& FM, const SourceManager &SM, const LangOptions &LangOpts, unsigned indent) { Indent(o, indent) << "\n"; ++indent; Indent(o, indent) << "kindcontrol\n"; // Emit edges. Indent(o, indent) << "edges\n"; ++indent; Indent(o, indent) << "\n"; ++indent; for (PathDiagnosticControlFlowPiece::const_iterator I=P.begin(), E=P.end(); I!=E; ++I) { Indent(o, indent) << "\n"; ++indent; Indent(o, indent) << "start\n"; EmitRange(o, SM, LangOpts, I->getStart().asRange(), FM, indent+1); Indent(o, indent) << "end\n"; EmitRange(o, SM, LangOpts, I->getEnd().asRange(), FM, indent+1); --indent; Indent(o, indent) << "\n"; } --indent; Indent(o, indent) << "\n"; --indent; // Output any helper text. const std::string& s = P.getString(); if (!s.empty()) { Indent(o, indent) << "alternate"; EmitString(o, s) << '\n'; } --indent; Indent(o, indent) << "\n"; } static void ReportEvent(raw_ostream &o, const PathDiagnosticPiece& P, const FIDMap& FM, const SourceManager &SM, const LangOptions &LangOpts, unsigned indent) { Indent(o, indent) << "\n"; ++indent; Indent(o, indent) << "kindevent\n"; // Output the location. FullSourceLoc L = P.getLocation().asLocation(); Indent(o, indent) << "location\n"; EmitLocation(o, SM, LangOpts, L, FM, indent); // Output the ranges (if any). PathDiagnosticPiece::range_iterator RI = P.ranges_begin(), RE = P.ranges_end(); if (RI != RE) { Indent(o, indent) << "ranges\n"; Indent(o, indent) << "\n"; ++indent; for (; RI != RE; ++RI) EmitRange(o, SM, LangOpts, *RI, FM, indent+1); --indent; Indent(o, indent) << "\n"; } // Output the text. assert(!P.getString().empty()); Indent(o, indent) << "extended_message\n"; Indent(o, indent); EmitString(o, P.getString()) << '\n'; // Output the short text. // FIXME: Really use a short string. Indent(o, indent) << "message\n"; EmitString(o, P.getString()) << '\n'; // Finish up. --indent; Indent(o, indent); o << "\n"; } static void ReportMacro(raw_ostream &o, const PathDiagnosticMacroPiece& P, const FIDMap& FM, const SourceManager &SM, const LangOptions &LangOpts, unsigned indent) { for (PathDiagnosticMacroPiece::const_iterator I=P.begin(), E=P.end(); I!=E; ++I) { switch ((*I)->getKind()) { default: break; case PathDiagnosticPiece::Event: ReportEvent(o, cast(**I), FM, SM, LangOpts, indent); break; case PathDiagnosticPiece::Macro: ReportMacro(o, cast(**I), FM, SM, LangOpts, indent); break; } } } static void ReportDiag(raw_ostream &o, const PathDiagnosticPiece& P, const FIDMap& FM, const SourceManager &SM, const LangOptions &LangOpts) { unsigned indent = 4; switch (P.getKind()) { case PathDiagnosticPiece::ControlFlow: ReportControlFlow(o, cast(P), FM, SM, LangOpts, indent); break; case PathDiagnosticPiece::Event: ReportEvent(o, cast(P), FM, SM, LangOpts, indent); break; case PathDiagnosticPiece::Macro: ReportMacro(o, cast(P), FM, SM, LangOpts, indent); break; } } void PlistDiagnostics::HandlePathDiagnosticImpl(const PathDiagnostic* D) { if (!D) return; if (D->empty()) { delete D; return; } // We need to flatten the locations (convert Stmt* to locations) because // the referenced statements may be freed by the time the diagnostics // are emitted. const_cast(D)->flattenLocations(); BatchedDiags.push_back(D); } void PlistDiagnostics::FlushDiagnostics(SmallVectorImpl *FilesMade) { if (flushed) return; flushed = true; // Sort the diagnostics so that they are always emitted in a deterministic // order. if (!BatchedDiags.empty()) std::sort(BatchedDiags.begin(), BatchedDiags.end(), CompareDiagnostics()); // Build up a set of FIDs that we use by scanning the locations and // ranges of the diagnostics. FIDMap FM; SmallVector Fids; const SourceManager* SM = 0; if (!BatchedDiags.empty()) SM = &(*BatchedDiags.begin())->begin()->getLocation().getManager(); for (std::vector::iterator DI = BatchedDiags.begin(), DE = BatchedDiags.end(); DI != DE; ++DI) { const PathDiagnostic *D = *DI; for (PathDiagnostic::const_iterator I=D->begin(), E=D->end(); I!=E; ++I) { AddFID(FM, Fids, SM, I->getLocation().asLocation()); for (PathDiagnosticPiece::range_iterator RI=I->ranges_begin(), RE=I->ranges_end(); RI!=RE; ++RI) { AddFID(FM, Fids, SM, RI->getBegin()); AddFID(FM, Fids, SM, RI->getEnd()); } } } // Open the file. std::string ErrMsg; llvm::raw_fd_ostream o(OutputFile.c_str(), ErrMsg); if (!ErrMsg.empty()) { llvm::errs() << "warning: could not creat file: " << OutputFile << '\n'; return; } // Write the plist header. o << "\n" "\n" "\n"; // Write the root object: a containing... // - "files", an mapping from FIDs to file names // - "diagnostics", an containing the path diagnostics o << "\n" " files\n" " \n"; for (SmallVectorImpl::iterator I=Fids.begin(), E=Fids.end(); I!=E; ++I) { o << " "; EmitString(o, SM->getFileEntryForID(*I)->getName()) << '\n'; } o << " \n" " diagnostics\n" " \n"; for (std::vector::iterator DI=BatchedDiags.begin(), DE = BatchedDiags.end(); DI!=DE; ++DI) { o << " \n" " path\n"; const PathDiagnostic *D = *DI; // Create an owning smart pointer for 'D' just so that we auto-free it // when we exit this method. llvm::OwningPtr OwnedD(const_cast(D)); o << " \n"; for (PathDiagnostic::const_iterator I=D->begin(), E=D->end(); I != E; ++I) ReportDiag(o, *I, FM, *SM, LangOpts); o << " \n"; // Output the bug type and bug category. o << " description"; EmitString(o, D->getDescription()) << '\n'; o << " category"; EmitString(o, D->getCategory()) << '\n'; o << " type"; EmitString(o, D->getBugType()) << '\n'; // Output the location of the bug. o << " location\n"; EmitLocation(o, *SM, LangOpts, D->getLocation(), FM, 2); // Output the diagnostic to the sub-diagnostic client, if any. if (SubPD) { SubPD->HandlePathDiagnostic(OwnedD.take()); SmallVector SubFilesMade; SubPD->FlushDiagnostics(SubFilesMade); if (!SubFilesMade.empty()) { o << " " << SubPD->getName() << "_files\n"; o << " \n"; for (size_t i = 0, n = SubFilesMade.size(); i < n ; ++i) o << " " << SubFilesMade[i] << "\n"; o << " \n"; } } // Close up the entry. o << " \n"; } o << " \n"; // Finish. o << "\n"; if (FilesMade) FilesMade->push_back(OutputFile); BatchedDiags.clear(); }