/***************************************************Project Mutator****************************************************/ //-*-c++-*- /*first line intentionally left blank.*/ /*Copyright (C) 2017 Farzad Sadeghi This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.*/ /*code structure inspired by Eli Bendersky's tutorial on Rewriters.*/ /**********************************************************************************************************************/ /*FIXME-all classes should use replacements.*/ //@DEVI-FIXME-will mess up macros /**********************************************************************************************************************/ /*included modules*/ /*project headers*/ #include "../mutator_aux.h" /*standard headers*/ #include #include #include #include #include #include /*LLVM headers*/ #include "clang/AST/AST.h" #include "clang/AST/ASTConsumer.h" #include "clang/ASTMatchers/ASTMatchers.h" #include "clang/ASTMatchers/ASTMatchFinder.h" #include "clang/Basic/LLVM.h" #include "clang/CodeGen/CodeGenAction.h" #include "clang/CodeGen/BackendUtil.h" #include "clang/Frontend/CompilerInstance.h" #include "clang/Frontend/FrontendActions.h" #include "clang/Lex/Lexer.h" #include "clang/Tooling/CommonOptionsParser.h" #include "clang/Tooling/Tooling.h" #include "clang/Rewrite/Core/Rewriter.h" #include "llvm/ADT/ArrayRef.h" #include "llvm/IR/IRBuilder.h" #include "llvm/IR/LLVMContext.h" #include "llvm/IR/Module.h" #include "llvm/IR/BasicBlock.h" #include "llvm/IR/Function.h" #include "llvm/IR/Function.h" #include "llvm/Support/raw_ostream.h" #include "llvm/Linker/Linker.h" /**********************************************************************************************************************/ /*used namespaces*/ using namespace llvm; using namespace clang; using namespace clang::ast_matchers; using namespace clang::driver; using namespace clang::tooling; /**********************************************************************************************************************/ /*global vars*/ static llvm::cl::OptionCategory MatcherSampleCategory("Matcher Sample"); /**********************************************************************************************************************/ //#define DBG /**********************************************************************************************************************/ // kill all comments /**********************************************************************************************************************/ // kill all whitespace, add , and ; /**********************************************************************************************************************/ class CalledFunc : public MatchFinder::MatchCallback { public: CalledFunc(Rewriter &Rewrite) : Rewrite(Rewrite) {} virtual void run(const MatchFinder::MatchResult &MR) { if (MR.Nodes.getNodeAs("calledfunc") != nullptr) { const CallExpr *CE = MR.Nodes.getNodeAs("calledfunc"); std::string name = CE->getDirectCallee()->getNameInfo().getAsString(); std::size_t hash = std::hash{}(name); std::string newname = "ID" + std::to_string(hash); #ifdef DBG std::cout << "CallExpr name: " << name << " Hash: " << hash << " New ID: " << newname << "\n"; #endif auto dummy = Rewrite.getRewrittenText(SourceRange(CE->getLocStart(), CE->getRParenLoc())); auto LParenOffset = dummy.find("("); dummy = Rewrite.getRewrittenText(SourceRange(CE->getLocStart(), CE->getLocStart().getLocWithOffset(LParenOffset - 1U))); Rewrite.ReplaceText(SourceRange(CE->getLocStart(), CE->getLocStart().getLocWithOffset(LParenOffset - 1U)), StringRef(newname)); } } private: Rewriter &Rewrite; }; /**********************************************************************************************************************/ class CalledVar : public MatchFinder::MatchCallback { public: CalledVar (Rewriter &Rewrite) : Rewrite(Rewrite) {} virtual void run(const MatchFinder::MatchResult &MR) { if (MR.Nodes.getNodeAs("calledvar") != nullptr) { const DeclRefExpr* DRE = MR.Nodes.getNodeAs("calledvar"); auto name = DRE->getNameInfo().getAsString(); std::size_t hash = std::hash{}(name); std::string newname = "ID" + std::to_string(hash); #ifdef DBG std::cout << "DeclRefExpr name: " << name << " Hash: " << hash << " New ID: " << newname << "\n"; #endif SourceLocation SL = DRE->getNameInfo().getBeginLoc(); SourceLocation SLE = DRE->getNameInfo().getEndLoc(); Rewrite.ReplaceText(SourceRange(SL, SLE), StringRef(newname)); } } private: Rewriter &Rewrite; }; /**********************************************************************************************************************/ class FuncDecl : public MatchFinder::MatchCallback { public: FuncDecl (Rewriter &Rewrite) : Rewrite (Rewrite) {} virtual void run(const MatchFinder::MatchResult &MR) { if (MR.Nodes.getNodeAs("funcdecl") != nullptr) { const FunctionDecl* FD = MR.Nodes.getNodeAs("funcdecl"); std::string funcname = FD->getNameInfo().getAsString(); if (funcname == "main") return void(); std::size_t hash = std::hash{}(funcname); std::string newname = "ID" + std::to_string(hash); #ifdef DBG std::cout << "Function name: " << funcname << " Hash: " << hash << " New ID: " << newname << "\n"; #endif SourceLocation SL = FD->getNameInfo().getBeginLoc(); SourceLocation SLE = FD->getNameInfo().getEndLoc(); Rewrite.ReplaceText(SourceRange(SL, SLE), StringRef(newname)); } } private: Rewriter &Rewrite; }; /**********************************************************************************************************************/ class VDecl : public MatchFinder::MatchCallback { public: VDecl (Rewriter &Rewrite) : Rewrite (Rewrite) {} virtual void run(const MatchFinder::MatchResult &MR) { if (MR.Nodes.getNodeAs("vardecl") != nullptr) { const VarDecl* VD = MR.Nodes.getNodeAs("vardecl"); std::string varname = VD->getIdentifier()->getName().str(); std::size_t hash = std::hash{}(varname); std::string newname = "ID" + std::to_string(hash); #ifdef DBG std::cout << "Var name: " << varname << " Hash: " << hash << " New ID: " << newname << "\n"; #endif SourceLocation SL = VD->getLocation(); SourceLocation SLE; const clang::Expr* EXP = nullptr; if (MR.Nodes.getNodeAs("expr") !=nullptr) { EXP = MR.Nodes.getNodeAs("expr"); SLE = EXP->getExprLoc(); } else { SLE = VD->getLocEnd(); } //@devi-FIXME-cluncky Rewrite.ReplaceText(SourceRange(SL, SL.getLocWithOffset(VD->getIdentifier()->getLength() - 1)), StringRef(newname)); } } private: Rewriter &Rewrite; }; /**********************************************************************************************************************/ class ClassDecl : public MatchFinder::MatchCallback { public: ClassDecl (Rewriter &Rewrite) : Rewrite(Rewrite) {} virtual void run(const MatchFinder::MatchResult &MR) { if (MR.Nodes.getNodeAs("classdecl") != nullptr) { const RecordDecl* RD = MR.Nodes.getNodeAs("classdecl"); if (RD->isAnonymousStructOrUnion()) return void(); if (RD->isInjectedClassName()) {} else {return void();} auto TD = RD->getCanonicalDecl(); std::string varname = RD->getIdentifier()->getName().str(); std::size_t hash = std::hash{}(varname); std::string newname = "ID" + std::to_string(hash); #ifdef DBG std::cout << "Record name: " << varname << " Hash: " << hash << " New ID: " << newname << "\n"; #endif SourceLocation SL = RD->getLocation(); SourceLocation SLE = RD->getLocEnd(); std::string dummy = Rewrite.getRewrittenText(SourceRange(SL, SLE)); Rewrite.ReplaceText(SourceRange(SL, SLE), StringRef(newname)); } } private: Rewriter &Rewrite; }; /**********************************************************************************************************************/ class PPInclusion : public PPCallbacks { public: explicit PPInclusion (SourceManager *SM, Rewriter *Rewrite) : SM(*SM), Rewrite(*Rewrite) {} virtual void MacroDefined(const Token &MacroNameTok, const MacroDirective *MD) { const MacroInfo* MI = MD->getMacroInfo(); SourceLocation SL = MacroNameTok.getLocation(); if (!SM.isInMainFile(SL)) return void(); if (!SM.isWrittenInMainFile(SL)) return void(); CheckSLValidity(SL); std::string macroname = MacroNameTok.getIdentifierInfo()->getName().str(); std::size_t hash = std::hash{}(macroname); std::string newname = "ID" + std::to_string(hash); #ifdef DBG std::cout << "Macro name: " << macroname << " Hash: " << hash << " New ID: " << newname << "\n"; #endif //std::string dummy = Rewrite.getRewrittenText(SourceRange(MacroNameTok.getLocation(), MacroNameTok.getLocation().getLocWithOffset(MacroNameTok.getLength()))); //std::cout << dummy << "\n"; Rewrite.ReplaceText(SourceRange(MacroNameTok.getLocation(), MacroNameTok.getLocation().getLocWithOffset(MacroNameTok.getLength())), newname); } private: const SourceManager &SM; Rewriter &Rewrite; }; /**********************************************************************************************************************/ class BlankDiagConsumer : public clang::DiagnosticConsumer { public: BlankDiagConsumer() = default; virtual ~BlankDiagConsumer() {} virtual void HandleDiagnostic(DiagnosticsEngine::Level DiagLevel, const Diagnostic &Info) override {} }; /**********************************************************************************************************************/ class MyASTConsumer : public ASTConsumer { public: MyASTConsumer(Rewriter &R) : funcDeclHandler(R), HandlerForVar(R), HandlerForClass(R), HandlerForCalledFunc(R), HandlerForCalledVar(R) { Matcher.addMatcher(functionDecl().bind("funcdecl"), &funcDeclHandler); Matcher.addMatcher(varDecl(anyOf(unless(hasDescendant(expr(anything()))), hasDescendant(expr(anything()).bind("expr")))).bind("vardecl"), &HandlerForVar); Matcher.addMatcher(recordDecl(isClass()).bind("classdecl"), &HandlerForClass); //Matcher.addMatcher(callExpr().bind("calledfunc"), &HandlerForCalledFunc); Matcher.addMatcher(declRefExpr().bind("calledvar"), &HandlerForCalledVar); } void HandleTranslationUnit(ASTContext &Context) override { Matcher.matchAST(Context); } private: FuncDecl funcDeclHandler; VDecl HandlerForVar; ClassDecl HandlerForClass; CalledFunc HandlerForCalledFunc; CalledVar HandlerForCalledVar; MatchFinder Matcher; }; /**********************************************************************************************************************/ class ObfFrontendAction : public ASTFrontendAction { public: ObfFrontendAction() {} ~ObfFrontendAction() { delete BDCProto; delete tee; } void EndSourceFileAction() override { std::error_code EC; std::string OutputFilename = "./obfuscator-tee"; TheRewriter.getEditBuffer(TheRewriter.getSourceMgr().getMainFileID()).write(llvm::outs()); tee = new raw_fd_ostream(StringRef(OutputFilename), EC, sys::fs::F_None); TheRewriter.getEditBuffer(TheRewriter.getSourceMgr().getMainFileID()).write(*tee); } std::unique_ptr CreateASTConsumer(CompilerInstance &CI, StringRef file) override { CI.getPreprocessor().addPPCallbacks(llvm::make_unique(&CI.getSourceManager(), &TheRewriter)); DiagnosticsEngine &DE = CI.getPreprocessor().getDiagnostics(); DE.setClient(BDCProto, false); TheRewriter.setSourceMgr(CI.getSourceManager(), CI.getLangOpts()); return llvm::make_unique(TheRewriter); } private: BlankDiagConsumer* BDCProto = new BlankDiagConsumer; Rewriter TheRewriter; raw_ostream *tee = &llvm::outs(); }; /**********************************************************************************************************************/ class CommentWiper { public: CommentWiper(std::vector SourceList) : sourcelist(SourceList) {} int run(void) { for (auto &filepath : sourcelist) { //std::regex comment1("//.+"); //std::regex comment2("/\\*.+\\*/"); //std::regex comment2("/\\*[^]+\\*/"); //std::regex multibegin("/\\*.+(?!\\*/)"); //std::regex multiend("(? sourcelist; }; /**********************************************************************************************************************/ class WhitespaceWarper { public: WhitespaceWarper(std::vector SourceList) : sourcelist(SourceList) {} int run(void) { for (auto &filepath : sourcelist) { std::ifstream sourcefile; sourcefile.open("../test/bruisertest/obfuscator-tee"); std::ofstream dupe; dupe.open("./dupe.cpp"); std::string line; while (std::getline(sourcefile, line)) { for (auto &character : line) { if (std::to_string(character) == "\t") { dupe << "\t"; } else if (std::to_string(character) == "\n") { } else if (std::to_string(character) == " ") { dupe << " "; } else { dupe << character; } } } dupe.close(); } return 0; } private: std::vector sourcelist; }; /**********************************************************************************************************************/ /*Main*/ int main(int argc, const char **argv) { CommonOptionsParser op(argc, argv, MatcherSampleCategory); const std::vector &SourcePathList = op.getSourcePathList(); ClangTool Tool(op.getCompilations(), op.getSourcePathList()); int ret = Tool.run(newFrontendActionFactory().get()); WhitespaceWarper WW(SourcePathList); //WW.run(); CommentWiper CW(SourcePathList); CW.run(); return ret; } /**********************************************************************************************************************/ /*last line intentionally left blank.*/