|  | // Copyright (c) 2013 The Chromium Authors. All rights reserved. | 
|  | // Use of this source code is governed by a BSD-style license that can be | 
|  | // found in the LICENSE file. | 
|  | // | 
|  | // This implements a Clang tool to convert all instances of std::string("") to | 
|  | // std::string(). The latter is more efficient (as std::string doesn't have to | 
|  | // take a copy of an empty string) and generates fewer instructions as well. It | 
|  | // should be run using the tools/clang/scripts/run_tool.py helper. | 
|  |  | 
|  | #include <memory> | 
|  | #include "clang/ASTMatchers/ASTMatchers.h" | 
|  | #include "clang/ASTMatchers/ASTMatchFinder.h" | 
|  | #include "clang/Basic/SourceManager.h" | 
|  | #include "clang/Frontend/FrontendActions.h" | 
|  | #include "clang/Tooling/CommonOptionsParser.h" | 
|  | #include "clang/Tooling/Refactoring.h" | 
|  | #include "clang/Tooling/Tooling.h" | 
|  | #include "llvm/Support/CommandLine.h" | 
|  |  | 
|  | using clang::ast_matchers::MatchFinder; | 
|  | using clang::ast_matchers::argumentCountIs; | 
|  | using clang::ast_matchers::bindTemporaryExpr; | 
|  | using clang::ast_matchers::constructorDecl; | 
|  | using clang::ast_matchers::constructExpr; | 
|  | using clang::ast_matchers::defaultArgExpr; | 
|  | using clang::ast_matchers::expr; | 
|  | using clang::ast_matchers::forEach; | 
|  | using clang::ast_matchers::has; | 
|  | using clang::ast_matchers::hasArgument; | 
|  | using clang::ast_matchers::hasDeclaration; | 
|  | using clang::ast_matchers::hasName; | 
|  | using clang::ast_matchers::id; | 
|  | using clang::ast_matchers::methodDecl; | 
|  | using clang::ast_matchers::newExpr; | 
|  | using clang::ast_matchers::ofClass; | 
|  | using clang::ast_matchers::stringLiteral; | 
|  | using clang::ast_matchers::varDecl; | 
|  | using clang::tooling::CommonOptionsParser; | 
|  | using clang::tooling::Replacement; | 
|  | using clang::tooling::Replacements; | 
|  |  | 
|  | namespace { | 
|  |  | 
|  | // Handles replacements for stack and heap-allocated instances, e.g.: | 
|  | // std::string a(""); | 
|  | // std::string* b = new std::string(""); | 
|  | class ConstructorCallback : public MatchFinder::MatchCallback { | 
|  | public: | 
|  | ConstructorCallback(Replacements* replacements) | 
|  | : replacements_(replacements) {} | 
|  |  | 
|  | virtual void run(const MatchFinder::MatchResult& result) override; | 
|  |  | 
|  | private: | 
|  | Replacements* const replacements_; | 
|  | }; | 
|  |  | 
|  | // Handles replacements for invocations of std::string("") in an initializer | 
|  | // list. | 
|  | class InitializerCallback : public MatchFinder::MatchCallback { | 
|  | public: | 
|  | InitializerCallback(Replacements* replacements) | 
|  | : replacements_(replacements) {} | 
|  |  | 
|  | virtual void run(const MatchFinder::MatchResult& result) override; | 
|  |  | 
|  | private: | 
|  | Replacements* const replacements_; | 
|  | }; | 
|  |  | 
|  | // Handles replacements for invocations of std::string("") in a temporary | 
|  | // context, e.g. FunctionThatTakesString(std::string("")). Note that this | 
|  | // handles implicits construction of std::string as well. | 
|  | class TemporaryCallback : public MatchFinder::MatchCallback { | 
|  | public: | 
|  | TemporaryCallback(Replacements* replacements) : replacements_(replacements) {} | 
|  |  | 
|  | virtual void run(const MatchFinder::MatchResult& result) override; | 
|  |  | 
|  | private: | 
|  | Replacements* const replacements_; | 
|  | }; | 
|  |  | 
|  | class EmptyStringConverter { | 
|  | public: | 
|  | explicit EmptyStringConverter(Replacements* replacements) | 
|  | : constructor_callback_(replacements), | 
|  | initializer_callback_(replacements), | 
|  | temporary_callback_(replacements) {} | 
|  |  | 
|  | void SetupMatchers(MatchFinder* match_finder); | 
|  |  | 
|  | private: | 
|  | ConstructorCallback constructor_callback_; | 
|  | InitializerCallback initializer_callback_; | 
|  | TemporaryCallback temporary_callback_; | 
|  | }; | 
|  |  | 
|  | void EmptyStringConverter::SetupMatchers(MatchFinder* match_finder) { | 
|  | const clang::ast_matchers::StatementMatcher& constructor_call = | 
|  | id("call", | 
|  | constructExpr( | 
|  | hasDeclaration(methodDecl(ofClass(hasName("std::basic_string")))), | 
|  | argumentCountIs(2), | 
|  | hasArgument(0, id("literal", stringLiteral())), | 
|  | hasArgument(1, defaultArgExpr()))); | 
|  |  | 
|  | // Note that expr(has()) in the matcher is significant; the Clang AST wraps | 
|  | // calls to the std::string constructor with exprWithCleanups nodes. Without | 
|  | // the expr(has()) matcher, the first and last rules would not match anything! | 
|  | match_finder->addMatcher(varDecl(forEach(expr(has(constructor_call)))), | 
|  | &constructor_callback_); | 
|  | match_finder->addMatcher(newExpr(has(constructor_call)), | 
|  | &constructor_callback_); | 
|  | match_finder->addMatcher(bindTemporaryExpr(has(constructor_call)), | 
|  | &temporary_callback_); | 
|  | match_finder->addMatcher( | 
|  | constructorDecl(forEach(expr(has(constructor_call)))), | 
|  | &initializer_callback_); | 
|  | } | 
|  |  | 
|  | void ConstructorCallback::run(const MatchFinder::MatchResult& result) { | 
|  | const clang::StringLiteral* literal = | 
|  | result.Nodes.getNodeAs<clang::StringLiteral>("literal"); | 
|  | if (literal->getLength() > 0) | 
|  | return; | 
|  |  | 
|  | const clang::CXXConstructExpr* call = | 
|  | result.Nodes.getNodeAs<clang::CXXConstructExpr>("call"); | 
|  | clang::CharSourceRange range = | 
|  | clang::CharSourceRange::getTokenRange(call->getParenOrBraceRange()); | 
|  | replacements_->insert(Replacement(*result.SourceManager, range, "")); | 
|  | } | 
|  |  | 
|  | void InitializerCallback::run(const MatchFinder::MatchResult& result) { | 
|  | const clang::StringLiteral* literal = | 
|  | result.Nodes.getNodeAs<clang::StringLiteral>("literal"); | 
|  | if (literal->getLength() > 0) | 
|  | return; | 
|  |  | 
|  | const clang::CXXConstructExpr* call = | 
|  | result.Nodes.getNodeAs<clang::CXXConstructExpr>("call"); | 
|  | replacements_->insert(Replacement(*result.SourceManager, call, "")); | 
|  | } | 
|  |  | 
|  | void TemporaryCallback::run(const MatchFinder::MatchResult& result) { | 
|  | const clang::StringLiteral* literal = | 
|  | result.Nodes.getNodeAs<clang::StringLiteral>("literal"); | 
|  | if (literal->getLength() > 0) | 
|  | return; | 
|  |  | 
|  | const clang::CXXConstructExpr* call = | 
|  | result.Nodes.getNodeAs<clang::CXXConstructExpr>("call"); | 
|  | // Differentiate between explicit and implicit calls to std::string's | 
|  | // constructor. An implicitly generated constructor won't have a valid | 
|  | // source range for the parenthesis. We do this because the matched expression | 
|  | // for |call| in the explicit case doesn't include the closing parenthesis. | 
|  | clang::SourceRange range = call->getParenOrBraceRange(); | 
|  | if (range.isValid()) { | 
|  | replacements_->insert(Replacement(*result.SourceManager, literal, "")); | 
|  | } else { | 
|  | replacements_->insert( | 
|  | Replacement(*result.SourceManager, | 
|  | call, | 
|  | literal->isWide() ? "std::wstring()" : "std::string()")); | 
|  | } | 
|  | } | 
|  |  | 
|  | }  // namespace | 
|  |  | 
|  | static llvm::cl::extrahelp common_help(CommonOptionsParser::HelpMessage); | 
|  |  | 
|  | int main(int argc, const char* argv[]) { | 
|  | llvm::cl::OptionCategory category("EmptyString Tool"); | 
|  | CommonOptionsParser options(argc, argv, category); | 
|  | clang::tooling::ClangTool tool(options.getCompilations(), | 
|  | options.getSourcePathList()); | 
|  |  | 
|  | Replacements replacements; | 
|  | EmptyStringConverter converter(&replacements); | 
|  | MatchFinder match_finder; | 
|  | converter.SetupMatchers(&match_finder); | 
|  |  | 
|  | std::unique_ptr<clang::tooling::FrontendActionFactory> frontend_factory = | 
|  | clang::tooling::newFrontendActionFactory(&match_finder); | 
|  | int result = tool.run(frontend_factory.get()); | 
|  | if (result != 0) | 
|  | return result; | 
|  |  | 
|  | // Each replacement line should have the following format: | 
|  | // r:<file path>:<offset>:<length>:<replacement text> | 
|  | // Only the <replacement text> field can contain embedded ":" characters. | 
|  | // TODO(dcheng): Use a more clever serialization. Ideally we'd use the YAML | 
|  | // serialization and then use clang-apply-replacements, but that would require | 
|  | // copying and pasting a larger amount of boilerplate for all Chrome clang | 
|  | // tools. | 
|  | llvm::outs() << "==== BEGIN EDITS ====\n"; | 
|  | for (const auto& r : replacements) { | 
|  | llvm::outs() << "r:" << r.getFilePath() << ":" << r.getOffset() << ":" | 
|  | << r.getLength() << ":" << r.getReplacementText() << "\n"; | 
|  | } | 
|  | llvm::outs() << "==== END EDITS ====\n"; | 
|  |  | 
|  | return 0; | 
|  | } |