forked from scrt/avcleaner
-
Notifications
You must be signed in to change notification settings - Fork 1
/
MatchHandler.h
160 lines (133 loc) · 6.77 KB
/
MatchHandler.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
//
// Created by vladimir on 28.09.19.
//
#ifndef AVCLEANER_MATCHHANDLER_H
#define AVCLEANER_MATCHHANDLER_H
#include <vector>
#include <string>
#include <memory>
#include "llvm/Support/raw_ostream.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/ArrayRef.h"
#include "clang/Rewrite/Core/Rewriter.h"
#include "clang/Tooling/Tooling.h"
#include "clang/Tooling/CommonOptionsParser.h"
#include "clang/Frontend/FrontendAction.h"
#include "clang/Frontend/CompilerInstance.h"
#include "clang/Basic/SourceManager.h"
#include "clang/ASTMatchers/ASTMatchers.h"
#include "clang/ASTMatchers/ASTMatchFinder.h"
#include "clang/AST/Type.h"
#include "clang/AST/Decl.h"
#include "clang/AST/ASTContext.h"
#include "clang/AST/ASTConsumer.h"
#include "clang/AST/AST.h"
#include "clang/AST/ASTConsumer.h"
#include "clang/AST/RecursiveASTVisitor.h"
#include "clang/Frontend/ASTConsumers.h"
#include "clang/Frontend/CompilerInstance.h"
#include "clang/Frontend/FrontendActions.h"
#include "clang/Rewrite/Core/Rewriter.h"
#include "clang/Tooling/CommonOptionsParser.h"
#include "clang/Tooling/Tooling.h"
#include "llvm/Support/raw_ostream.h"
class MatchHandler : public clang::ast_matchers::MatchFinder::MatchCallback {
public:
using MatchResult = clang::ast_matchers::MatchFinder::MatchResult;
MatchHandler(clang::Rewriter *rewriter);
void run(const MatchResult &Result) override; // callback function that runs when a Match is found.
/**
* strip metacharacters decorating a string.
* For instance, L"ntdll" -> ntdll
* @param Argument the string to be cleaned.
*/
static void cleanParameter(std::string &Argument);
/**
* used to replace a string literal by a variable's identifier
* must not collide with existing identifiers.
* Format: 12-first characters, letters only + random part
* TODO: remember allocated identifiers for collision prevention
* TODO: extract constants into readable identifiers.
* @param StrLiteral the string literal
*/
static std::string translateStringToIdentifier(const std::string &StrLiteral);
/**
* @brief declares and instantiate a variable holding a string that was moved out from a function's arguments.
* @param StringIdentifier the new variable identifier.
* @param StringValue the actual value of the string literal.
* @return the generated code snippet.
*/
static std::string
generateVariableDeclaration(const std::string &StringIdentifier, std::string &StringValue);
private:
clang::Rewriter *ASTRewriter; // an instance to a Rewriter to manage changes to the AST.
// climb the list of parents recursively until it finds a useful node (i.e. not Cast-like nodes).
bool climbParentsIgnoreCast(const clang::StringLiteral &NodeString, clang::ast_type_traits::DynTypedNode node,
clang::ASTContext *pContext, uint64_t iterations);
/**
* gets a list of all the parent nodes of a given StringLiteral node, ignoring Cast-like nodes.
* @param NodeString a StringLiteral node
* @param Node Holds the current parent node, empty at first iteration.
* @param Context ASTContext of the initial node.
* @param CurrentParents Accumulator of encountered parent nodes.
* @param Iterations Number of iterations, used to prevent stack overflow.
* @return a vector of strings of encountered parents NodeKind.
*/
static std::vector<std::string>
getNodeParents(const clang::StringLiteral &NodeString, clang::ast_type_traits::DynTypedNode Node,
clang::ASTContext *Context, std::vector<std::string> &CurrentParents, uint64_t Iterations);
/**
* @brief decides what to do according to the location in the AST of the identified string literal.
* @param pLiteral the identified string literal.
* @param pContext ASTContext of the string literal pLiteral.
* @param node dummy node used to store the string literal successive parent.
*/
void handleStringInContext(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext,
clang::ast_type_traits::DynTypedNode node);
/**
*
* @param pLiteral a string occurrence to be encrypted
* @param pContext an instance of ASTContext
* @param node the AST node that makes use of the string pLiteral
*/
void handleCallExpr(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext,
clang::ast_type_traits::DynTypedNode node);
/**
* @brief generates a random string of size Length.
* @param Length desired length of the generated string.
* @return a random string of size Length.
*/
static std::string randomString(unsigned long Length);
/**
* @brief Finds some free space to inject code that must run before the string literals usages.
* @param Context an ASTContext instance.
* @param Parent the current parent node of the string literal. Empty node for the first iteration.
* @param Literal a string literal.
* @param Iterations used to prevent a recursion infinite loop.
* @return the location of a nice injection spot.
*/
static clang::SourceRange
findInjectionSpot(clang::ASTContext *Context, clang::ast_type_traits::DynTypedNode Parent,
const clang::StringLiteral &Literal, bool IsGlobal, uint64_t Iterations);
const static uint64_t CLIMB_PARENTS_MAX_ITER = 1000; // fail safe to prevent a recursion loop when climbing the list of parents.
/**
* offers a chance to bail out from the refactoring process if the string literal is found in an unpatchable location.
* @param FunctionName
* @return true if the FunctionName is not blacklisted.
*/
static bool isBlacklistedFunction(const clang::CallExpr *FunctionName);
void handleInitListExpr(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext,
clang::ast_type_traits::DynTypedNode node);
bool shouldAbort(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext, clang::SourceRange string);
std::vector<const clang::StringLiteral*> EncounteredStrings; // collections of refactored String literals.
static bool isStringLiteralInGlobal(clang::ASTContext *Context, const clang::StringLiteral &Literal);
bool replaceStringLiteral(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext,
clang::SourceRange range,
const std::string& string);
bool insertVariableDeclaration(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext,
clang::SourceRange range, const std::string& string);
bool handleExpr(const clang::StringLiteral *pLiteral, clang::ASTContext *pContext,
clang::ast_type_traits::DynTypedNode node);
};
#endif //AVCLEANER_MATCHHANDLER_H