Static Value-Flow Analysis
Loading...
Searching...
No Matches
AEDetector.cpp
Go to the documentation of this file.
1//===- AEDetector.cpp -- Vulnerability Detectors---------------------------------//
2//
3// SVF: Static Value-Flow Analysis
4//
5// Copyright (C) <2013-> <Yulei Sui>
6//
7
8// This program is free software: you can redistribute it and/or modify
9// it under the terms of the GNU Affero General Public License as published by
10// the Free Software Foundation, either version 3 of the License, or
11// (at your option) any later version.
12
13// This program is distributed in the hope that it will be useful,
14// but WITHOUT ANY WARRANTY; without even the implied warranty of
15// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16// GNU Affero General Public License for more details.
17
18// You should have received a copy of the GNU Affero General Public License
19// along with this program. If not, see <http://www.gnu.org/licenses/>.
20//
21//===----------------------------------------------------------------------===//
22
23
24//
25// Created by Jiawei Wang on 2024/8/20.
26//
27
29#include <AE/Svfexe/AbsExtAPI.h>
31
32using namespace SVF;
33
45{
46 if (!SVFUtil::isa<CallICFGNode>(node))
47 {
48 // Handle non-call nodes by analyzing GEP instructions
49 for (const SVFStmt* stmt : node->getSVFStmts())
50 {
51 if (const GepStmt* gep = SVFUtil::dyn_cast<GepStmt>(stmt))
52 {
53 SVFIR* svfir = PAG::getPAG();
54 NodeID lhs = gep->getLHSVarID();
55 NodeID rhs = gep->getRHSVarID();
56
57 // Update the GEP object offset from its base
58 updateGepObjOffsetFromBase(as[lhs].getAddrs(), as[rhs].getAddrs(), as.getByteOffset(gep));
59
61 AddressValue objAddrs = as[gep->getRHSVarID()].getAddrs();
62 for (const auto& addr : objAddrs)
63 {
65 u32_t size = 0;
66
68 {
69 size = svfir->getBaseObject(objId)->getByteSizeOfObj();
70 }
71 else
72 {
74 for (const SVFStmt* stmt2 : addrNode->getSVFStmts())
75 {
76 if (const AddrStmt* addrStmt = SVFUtil::dyn_cast<AddrStmt>(stmt2))
77 {
78 size = as.getAllocaInstByteSize(addrStmt);
79 }
80 }
81 }
82
83 // Calculate access offset and check for potential overflow
85 if (accessOffset.ub().getIntNumeral() >= size)
86 {
87 AEException bug(stmt->toString());
88 addBugToReporter(bug, stmt->getICFGNode());
89 }
90 }
91 }
92 }
93 }
94 else
95 {
96 // Handle call nodes by checking for external API calls
97 const CallICFGNode* callNode = SVFUtil::cast<CallICFGNode>(node);
98 if (SVFUtil::isExtCall(callNode->getCalledFunction()))
99 {
101 }
102 }
103}
104
105
114{
115 // get function name
116 std::string funcName = callNode->getCalledFunction()->getName();
117 if (funcName == "SAFE_BUFACCESS")
118 {
119 // void SAFE_BUFACCESS(void* data, int size);
121 if (callNode->arg_size() < 2)
122 return;
125 callNode);
126 u32_t size_id = callNode->getArgument(1)->getId();
127 IntervalValue val = as[size_id].getInterval();
128 if (val.isBottom())
129 {
130 val = IntervalValue(0);
131 assert(false && "SAFE_BUFACCESS size is bottom");
132 }
133 const SVFVar* arg0Val = callNode->getArgument(0);
135 if (isSafe)
136 {
137 std::cout << "safe buffer access success: " << callNode->toString()
138 << std::endl;
139 return;
140 }
141 else
142 {
143 std::string err_msg = "this SAFE_BUFACCESS should be a safe access but detected buffer overflow. Pos: ";
144 err_msg += callNode->getSourceLoc();
145 std::cerr << err_msg << std::endl;
146 assert(false);
147 }
148 }
149 else if (funcName == "UNSAFE_BUFACCESS")
150 {
151 // handle other stub functions
152 //void UNSAFE_BUFACCESS(void* data, int size);
154 if (callNode->arg_size() < 2) return;
156 u32_t size_id = callNode->getArgument(1)->getId();
157 IntervalValue val = as[size_id].getInterval();
158 if (val.isBottom())
159 {
160 assert(false && "UNSAFE_BUFACCESS size is bottom");
161 }
162 const SVFVar* arg0Val = callNode->getArgument(0);
164 if (!isSafe)
165 {
166 std::cout << "detect buffer overflow success: " << callNode->toString() << std::endl;
167 return;
168 }
169 else
170 {
171 std::string err_msg = "this UNSAFE_BUFACCESS should be a buffer overflow but not detected. Pos: ";
172 err_msg += callNode->getSourceLoc();
173 std::cerr << err_msg << std::endl;
174 assert(false);
175 }
176 }
177}
178
186{
187 extAPIBufOverflowCheckRules["llvm_memcpy_p0i8_p0i8_i64"] = {{0, 2}, {1, 2}};
188 extAPIBufOverflowCheckRules["llvm_memcpy_p0_p0_i64"] = {{0, 2}, {1, 2}};
189 extAPIBufOverflowCheckRules["llvm_memcpy_p0i8_p0i8_i32"] = {{0, 2}, {1, 2}};
190 extAPIBufOverflowCheckRules["llvm_memcpy"] = {{0, 2}, {1, 2}};
191 extAPIBufOverflowCheckRules["llvm_memmove"] = {{0, 2}, {1, 2}};
192 extAPIBufOverflowCheckRules["llvm_memmove_p0i8_p0i8_i64"] = {{0, 2}, {1, 2}};
193 extAPIBufOverflowCheckRules["llvm_memmove_p0_p0_i64"] = {{0, 2}, {1, 2}};
194 extAPIBufOverflowCheckRules["llvm_memmove_p0i8_p0i8_i32"] = {{0, 2}, {1, 2}};
195 extAPIBufOverflowCheckRules["__memcpy_chk"] = {{0, 2}, {1, 2}};
196 extAPIBufOverflowCheckRules["memmove"] = {{0, 2}, {1, 2}};
197 extAPIBufOverflowCheckRules["bcopy"] = {{0, 2}, {1, 2}};
198 extAPIBufOverflowCheckRules["memccpy"] = {{0, 3}, {1, 3}};
199 extAPIBufOverflowCheckRules["__memmove_chk"] = {{0, 2}, {1, 2}};
200 extAPIBufOverflowCheckRules["llvm_memset"] = {{0, 2}};
201 extAPIBufOverflowCheckRules["llvm_memset_p0i8_i32"] = {{0, 2}};
202 extAPIBufOverflowCheckRules["llvm_memset_p0i8_i64"] = {{0, 2}};
203 extAPIBufOverflowCheckRules["llvm_memset_p0_i64"] = {{0, 2}};
204 extAPIBufOverflowCheckRules["__memset_chk"] = {{0, 2}};
205 extAPIBufOverflowCheckRules["wmemset"] = {{0, 2}};
206 extAPIBufOverflowCheckRules["strncpy"] = {{0, 2}, {1, 2}};
207 extAPIBufOverflowCheckRules["iconv"] = {{1, 2}, {3, 4}};
208}
209
220 const CallICFGNode* call)
221{
222 assert(call->getCalledFunction() && "FunObjVar* is nullptr");
223
225
226 // Determine the type of external memory API
227 for (const std::string &annotation : ExtAPI::getExtAPI()->getExtFuncAnnotations(call->getCalledFunction()))
228 {
229 if (annotation.find("MEMCPY") != std::string::npos)
231 if (annotation.find("MEMSET") != std::string::npos)
233 if (annotation.find("STRCPY") != std::string::npos)
235 if (annotation.find("STRCAT") != std::string::npos)
237 }
238
239 // Apply buffer overflow checks based on the determined API type
241 {
242 if (extAPIBufOverflowCheckRules.count(call->getCalledFunction()->getName()) == 0)
243 {
244 SVFUtil::errs() << "Warning: " << call->getCalledFunction()->getName() << " is not in the rules, please implement it\n";
245 return;
246 }
247 std::vector<std::pair<u32_t, u32_t>> args =
249 for (auto arg : args)
250 {
251 IntervalValue offset = as[call->getArgument(arg.second)->getId()].getInterval() - IntervalValue(1);
252 const SVFVar* argVar = call->getArgument(arg.first);
254 {
255 AEException bug(call->toString());
256 addBugToReporter(bug, call);
257 }
258 }
259 }
260 else if (extType == AbsExtAPI::MEMSET)
261 {
262 if (extAPIBufOverflowCheckRules.count(call->getCalledFunction()->getName()) == 0)
263 {
264 SVFUtil::errs() << "Warning: " << call->getCalledFunction()->getName() << " is not in the rules, please implement it\n";
265 return;
266 }
267 std::vector<std::pair<u32_t, u32_t>> args =
269 for (auto arg : args)
270 {
271 IntervalValue offset = as[call->getArgument(arg.second)->getId()].getInterval() - IntervalValue(1);
272 const SVFVar* argVar = call->getArgument(arg.first);
274 {
275 AEException bug(call->toString());
276 addBugToReporter(bug, call);
277 }
278 }
279 }
280 else if (extType == AbsExtAPI::STRCPY)
281 {
282 if (!detectStrcpy(as, call))
283 {
284 AEException bug(call->toString());
285 addBugToReporter(bug, call);
286 }
287 }
288 else if (extType == AbsExtAPI::STRCAT)
289 {
290 if (!detectStrcat(as, call))
291 {
292 AEException bug(call->toString());
293 addBugToReporter(bug, call);
294 }
295 }
296 else
297 {
298 // Handle other cases
299 }
300}
301
314{
315 SVFIR* svfir = PAG::getPAG();
316 auto obj = svfir->getGNode(objId);
317
318 // if the object is a BaseObjVar, return the byte offset directly
319 if (SVFUtil::isa<BaseObjVar>(obj))
320 {
321 return as.getByteOffset(gep);
322 }
323 else if (SVFUtil::isa<GepObjVar>(obj))
324 {
325 // if the object is a GepObjVar, return the offset from the base object
326 return getGepObjOffsetFromBase(SVFUtil::cast<GepObjVar>(obj)) + as.getByteOffset(gep);
327 }
328 else
329 {
330 assert(SVFUtil::isa<DummyObjVar>(obj) && "Unknown object type");
331 return IntervalValue::top();
332 }
333}
334
346{
347 SVFIR* svfir = PAG::getPAG();
348
349 for (const auto& objAddr : objAddrs)
350 {
352 auto obj = svfir->getGNode(objId);
353 // if the object is a BaseObjVar, add the offset directly
354 if (SVFUtil::isa<BaseObjVar>(obj))
355 {
356 for (const auto& gepAddr : gepAddrs)
357 {
359 const GepObjVar* gepObjVar = SVFUtil::cast<GepObjVar>(svfir->getGNode(gepObj));
361 }
362 }
363 else if (SVFUtil::isa<GepObjVar>(obj))
364 {
365 // if the object is a GepObjVar, add the offset from the base object
366 const GepObjVar* objVar = SVFUtil::cast<GepObjVar>(obj);
367 for (const auto& gepAddr : gepAddrs)
368 {
370 const GepObjVar* gepObjVar = SVFUtil::cast<GepObjVar>(svfir->getGNode(gepObj));
372 {
376 }
377 else
378 {
379 assert(false && "GEP RHS object has no offset from base");
380 }
381 }
382 }
383 }
384}
385
403
415{
416 const std::vector<std::string> strcatGroup = {"__strcat_chk", "strcat", "__wcscat_chk", "wcscat"};
417 const std::vector<std::string> strncatGroup = {"__strncat_chk", "strncat", "__wcsncat_chk", "wcsncat"};
418
419 if (std::find(strcatGroup.begin(), strcatGroup.end(), call->getCalledFunction()->getName()) != strcatGroup.end())
420 {
421 const SVFVar* arg0Val = call->getArgument(0);
422 const SVFVar* arg1Val = call->getArgument(1);
427 }
428 else if (std::find(strncatGroup.begin(), strncatGroup.end(), call->getCalledFunction()->getName()) != strncatGroup.end())
429 {
430 const SVFVar* arg0Val = call->getArgument(0);
431 const SVFVar* arg2Val = call->getArgument(2);
432 IntervalValue arg2Num = as[arg2Val->getId()].getInterval();
436 }
437 else
438 {
439 assert(false && "Unknown strcat function, please add it to strcatGroup or strncatGroup");
440 abort();
441 }
442}
443
456{
457 SVFIR* svfir = PAG::getPAG();
458 NodeID value_id = value->getId();
459
460 assert(as[value_id].isAddr());
461 for (const auto& addr : as[value_id].getAddrs())
462 {
464 u32_t size = 0;
465
466 // if the object is a constant size object, get the size directly
468 {
469 size = svfir->getBaseObject(objId)->getByteSizeOfObj();
470 }
471 else
472 {
473 // if the object is not a constant size object, get the size from the addrStmt
474 const ICFGNode* addrNode = svfir->getBaseObject(objId)->getICFGNode();
475 for (const SVFStmt* stmt2 : addrNode->getSVFStmts())
476 {
477 if (const AddrStmt* addrStmt = SVFUtil::dyn_cast<AddrStmt>(stmt2))
478 {
479 size = as.getAllocaInstByteSize(addrStmt);
480 }
481 }
482 }
483
485 // if the object is a GepObjVar, get the offset from the base object
486 if (SVFUtil::isa<GepObjVar>(svfir->getGNode(objId)))
487 {
488 offset = getGepObjOffsetFromBase(SVFUtil::cast<GepObjVar>(svfir->getGNode(objId))) + len;
489 }
490 else
491 {
492 // if the object is a BaseObjVar, get the offset directly
493 offset = len;
494 }
495 // if the offset is greater than the size, return false
496 if (offset.ub().getIntNumeral() >= size)
497 {
498 return false;
499 }
500 }
501 return true;
502}
buffer offset
Definition cJSON.cpp:1113
Exception class for handling errors in Abstract Execution.
Definition AEDetector.h:107
IntervalValue getStrlen(AbstractState &as, const SVF::SVFVar *strValue)
Calculates the length of a string.
ExtAPIType
Enumeration of external API types.
Definition AbsExtAPI.h:52
static AbstractInterpretation & getAEInstance()
AbstractState & getAbsStateFromTrace(const ICFGNode *node)
Set< const CallICFGNode * > checkpoints
static u32_t getInternalID(u32_t idx)
Return the internal index if idx is an address otherwise return the value of idx.
const ICFGNode * getICFGNode() const
Get the ICFGNode related to the creation of this object.
bool isConstantByteSize() const
Check if byte size is a const value.
u32_t getByteSizeOfObj() const
Get the byte size of this object.
IntervalValue getAccessOffset(AbstractState &as, NodeID objId, const GepStmt *gep)
Retrieves the access offset for a given object and GEP statement.
void addToGepObjOffsetFromBase(const GepObjVar *obj, const IntervalValue &offset)
Adds an offset to a GEP object.
Definition AEDetector.h:190
Map< std::string, std::vector< std::pair< u32_t, u32_t > > > extAPIBufOverflowCheckRules
Rules for checking buffer overflows in external APIs.
Definition AEDetector.h:318
void detect(AbstractState &as, const ICFGNode *)
Detect buffer overflow issues within a node.
bool detectStrcpy(AbstractState &as, const CallICFGNode *call)
Detects buffer overflow in 'strcpy' function calls.
bool detectStrcat(AbstractState &as, const CallICFGNode *call)
Detects buffer overflow in 'strcat' function calls.
IntervalValue getGepObjOffsetFromBase(const GepObjVar *obj) const
Retrieves the offset of a GEP object from its base.
Definition AEDetector.h:210
void handleStubFunctions(const CallICFGNode *)
Handles external API calls related to buffer overflow detection.
bool hasGepObjOffsetFromBase(const GepObjVar *obj) const
Checks if a GEP object has an associated offset.
Definition AEDetector.h:200
void updateGepObjOffsetFromBase(AddressValue gepAddrs, AddressValue objAddrs, IntervalValue offset)
Updates the offset of a GEP object from its base.
bool canSafelyAccessMemory(AbstractState &as, const SVFVar *value, const IntervalValue &len)
Checks if memory can be safely accessed.
void initExtAPIBufOverflowCheckRules()
Initializes external API buffer overflow check rules.
void detectExtAPI(AbstractState &as, const CallICFGNode *call)
Handles external API calls related to buffer overflow detection.
void addBugToReporter(const AEException &e, const ICFGNode *node)
Adds a bug to the reporter based on an exception.
Definition AEDetector.h:232
const std::string toString() const override
Definition ICFG.cpp:139
const ValVar * getArgument(u32_t ArgNo) const
Parameter operations.
Definition ICFGNode.h:494
const FunObjVar * getCalledFunction() const
Definition ICFGNode.h:512
static ExtAPI * getExtAPI()
Definition ExtAPI.cpp:43
const std::vector< std::string > & getExtFuncAnnotations(const FunObjVar *fun)
Definition ExtAPI.cpp:199
NodeType * getGNode(NodeID id) const
Get a node.
const SVFStmtList & getSVFStmts() const
Definition ICFGNode.h:117
static IntervalValue bottom()
Create the bottom IntervalValue [+inf, -inf].
static IntervalValue top()
Create the IntervalValue [-inf, +inf].
const BaseObjVar * getBaseObject(NodeID id) const
Definition SVFIR.h:423
static SVFIR * getPAG(bool buildFromFile=false)
Singleton design here to make sure we only have one instance during any analysis.
Definition SVFIR.h:116
NodeID getId() const
Get ID.
Definition SVFValue.h:158
virtual const std::string & getName() const
Definition SVFValue.h:184
std::ostream & errs()
Overwrite llvm::errs()
Definition SVFUtil.h:58
bool isExtCall(const FunObjVar *fun)
Definition SVFUtil.cpp:437
for isBitcode
Definition BasicTypes.h:68
u32_t NodeID
Definition GeneralType.h:56
llvm::IRBuilder IRBuilder
Definition BasicTypes.h:74
unsigned u32_t
Definition GeneralType.h:47