mirror of
https://github.com/llvm/llvm-project.git
synced 2025-05-02 19:26:05 +00:00

Although in a normal implementation the assumption is reasonable, it seems that some esoteric implementation are not returning a T&. This should be handled correctly and the values be propagated. --------- Co-authored-by: martinboehme <mboehme@google.com>
857 lines
29 KiB
C++
857 lines
29 KiB
C++
//===-- Transfer.cpp --------------------------------------------*- C++ -*-===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file defines transfer functions that evaluate program statements and
|
|
// update an environment accordingly.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "clang/Analysis/FlowSensitive/Transfer.h"
|
|
#include "clang/AST/Decl.h"
|
|
#include "clang/AST/DeclBase.h"
|
|
#include "clang/AST/DeclCXX.h"
|
|
#include "clang/AST/Expr.h"
|
|
#include "clang/AST/ExprCXX.h"
|
|
#include "clang/AST/OperationKinds.h"
|
|
#include "clang/AST/Stmt.h"
|
|
#include "clang/AST/StmtVisitor.h"
|
|
#include "clang/Analysis/FlowSensitive/ControlFlowContext.h"
|
|
#include "clang/Analysis/FlowSensitive/DataflowEnvironment.h"
|
|
#include "clang/Analysis/FlowSensitive/NoopAnalysis.h"
|
|
#include "clang/Analysis/FlowSensitive/RecordOps.h"
|
|
#include "clang/Analysis/FlowSensitive/Value.h"
|
|
#include "clang/Basic/Builtins.h"
|
|
#include "clang/Basic/OperatorKinds.h"
|
|
#include "llvm/Support/Casting.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include <assert.h>
|
|
#include <cassert>
|
|
|
|
#define DEBUG_TYPE "dataflow"
|
|
|
|
namespace clang {
|
|
namespace dataflow {
|
|
|
|
const Environment *StmtToEnvMap::getEnvironment(const Stmt &S) const {
|
|
auto BlockIt = CFCtx.getStmtToBlock().find(&ignoreCFGOmittedNodes(S));
|
|
assert(BlockIt != CFCtx.getStmtToBlock().end());
|
|
if (!CFCtx.isBlockReachable(*BlockIt->getSecond()))
|
|
return nullptr;
|
|
if (BlockIt->getSecond()->getBlockID() == CurBlockID)
|
|
return &CurState.Env;
|
|
const auto &State = BlockToState[BlockIt->getSecond()->getBlockID()];
|
|
if (!(State))
|
|
return nullptr;
|
|
return &State->Env;
|
|
}
|
|
|
|
static BoolValue &evaluateBooleanEquality(const Expr &LHS, const Expr &RHS,
|
|
Environment &Env) {
|
|
Value *LHSValue = Env.getValue(LHS);
|
|
Value *RHSValue = Env.getValue(RHS);
|
|
|
|
if (LHSValue == RHSValue)
|
|
return Env.getBoolLiteralValue(true);
|
|
|
|
if (auto *LHSBool = dyn_cast_or_null<BoolValue>(LHSValue))
|
|
if (auto *RHSBool = dyn_cast_or_null<BoolValue>(RHSValue))
|
|
return Env.makeIff(*LHSBool, *RHSBool);
|
|
|
|
return Env.makeAtomicBoolValue();
|
|
}
|
|
|
|
static BoolValue &unpackValue(BoolValue &V, Environment &Env) {
|
|
if (auto *Top = llvm::dyn_cast<TopBoolValue>(&V)) {
|
|
auto &A = Env.getDataflowAnalysisContext().arena();
|
|
return A.makeBoolValue(A.makeAtomRef(Top->getAtom()));
|
|
}
|
|
return V;
|
|
}
|
|
|
|
// Unpacks the value (if any) associated with `E` and updates `E` to the new
|
|
// value, if any unpacking occured. Also, does the lvalue-to-rvalue conversion,
|
|
// by skipping past the reference.
|
|
static Value *maybeUnpackLValueExpr(const Expr &E, Environment &Env) {
|
|
auto *Loc = Env.getStorageLocation(E);
|
|
if (Loc == nullptr)
|
|
return nullptr;
|
|
auto *Val = Env.getValue(*Loc);
|
|
|
|
auto *B = dyn_cast_or_null<BoolValue>(Val);
|
|
if (B == nullptr)
|
|
return Val;
|
|
|
|
auto &UnpackedVal = unpackValue(*B, Env);
|
|
if (&UnpackedVal == Val)
|
|
return Val;
|
|
Env.setValue(*Loc, UnpackedVal);
|
|
return &UnpackedVal;
|
|
}
|
|
|
|
static void propagateValue(const Expr &From, const Expr &To, Environment &Env) {
|
|
if (auto *Val = Env.getValue(From))
|
|
Env.setValue(To, *Val);
|
|
}
|
|
|
|
static void propagateStorageLocation(const Expr &From, const Expr &To,
|
|
Environment &Env) {
|
|
if (auto *Loc = Env.getStorageLocation(From))
|
|
Env.setStorageLocation(To, *Loc);
|
|
}
|
|
|
|
// Propagates the value or storage location of `From` to `To` in cases where
|
|
// `From` may be either a glvalue or a prvalue. `To` must be a glvalue iff
|
|
// `From` is a glvalue.
|
|
static void propagateValueOrStorageLocation(const Expr &From, const Expr &To,
|
|
Environment &Env) {
|
|
assert(From.isGLValue() == To.isGLValue());
|
|
if (From.isGLValue())
|
|
propagateStorageLocation(From, To, Env);
|
|
else
|
|
propagateValue(From, To, Env);
|
|
}
|
|
|
|
namespace {
|
|
|
|
class TransferVisitor : public ConstStmtVisitor<TransferVisitor> {
|
|
public:
|
|
TransferVisitor(const StmtToEnvMap &StmtToEnv, Environment &Env)
|
|
: StmtToEnv(StmtToEnv), Env(Env) {}
|
|
|
|
void VisitBinaryOperator(const BinaryOperator *S) {
|
|
const Expr *LHS = S->getLHS();
|
|
assert(LHS != nullptr);
|
|
|
|
const Expr *RHS = S->getRHS();
|
|
assert(RHS != nullptr);
|
|
|
|
switch (S->getOpcode()) {
|
|
case BO_Assign: {
|
|
auto *LHSLoc = Env.getStorageLocation(*LHS);
|
|
if (LHSLoc == nullptr)
|
|
break;
|
|
|
|
auto *RHSVal = Env.getValue(*RHS);
|
|
if (RHSVal == nullptr)
|
|
break;
|
|
|
|
// Assign a value to the storage location of the left-hand side.
|
|
Env.setValue(*LHSLoc, *RHSVal);
|
|
|
|
// Assign a storage location for the whole expression.
|
|
Env.setStorageLocation(*S, *LHSLoc);
|
|
break;
|
|
}
|
|
case BO_LAnd:
|
|
case BO_LOr: {
|
|
BoolValue &LHSVal = getLogicOperatorSubExprValue(*LHS);
|
|
BoolValue &RHSVal = getLogicOperatorSubExprValue(*RHS);
|
|
|
|
if (S->getOpcode() == BO_LAnd)
|
|
Env.setValue(*S, Env.makeAnd(LHSVal, RHSVal));
|
|
else
|
|
Env.setValue(*S, Env.makeOr(LHSVal, RHSVal));
|
|
break;
|
|
}
|
|
case BO_NE:
|
|
case BO_EQ: {
|
|
auto &LHSEqRHSValue = evaluateBooleanEquality(*LHS, *RHS, Env);
|
|
Env.setValue(*S, S->getOpcode() == BO_EQ ? LHSEqRHSValue
|
|
: Env.makeNot(LHSEqRHSValue));
|
|
break;
|
|
}
|
|
case BO_Comma: {
|
|
propagateValueOrStorageLocation(*RHS, *S, Env);
|
|
break;
|
|
}
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
void VisitDeclRefExpr(const DeclRefExpr *S) {
|
|
const ValueDecl *VD = S->getDecl();
|
|
assert(VD != nullptr);
|
|
|
|
// Some `DeclRefExpr`s aren't glvalues, so we can't associate them with a
|
|
// `StorageLocation`, and there's also no sensible `Value` that we can
|
|
// assign to them. Examples:
|
|
// - Non-static member variables
|
|
// - Non static member functions
|
|
// Note: Member operators are an exception to this, but apparently only
|
|
// if the `DeclRefExpr` is used within the callee of a
|
|
// `CXXOperatorCallExpr`. In other cases, for example when applying the
|
|
// address-of operator, the `DeclRefExpr` is a prvalue.
|
|
if (!S->isGLValue())
|
|
return;
|
|
|
|
auto *DeclLoc = Env.getStorageLocation(*VD);
|
|
if (DeclLoc == nullptr)
|
|
return;
|
|
|
|
Env.setStorageLocation(*S, *DeclLoc);
|
|
}
|
|
|
|
void VisitDeclStmt(const DeclStmt *S) {
|
|
// Group decls are converted into single decls in the CFG so the cast below
|
|
// is safe.
|
|
const auto &D = *cast<VarDecl>(S->getSingleDecl());
|
|
|
|
ProcessVarDecl(D);
|
|
}
|
|
|
|
void ProcessVarDecl(const VarDecl &D) {
|
|
// Static local vars are already initialized in `Environment`.
|
|
if (D.hasGlobalStorage())
|
|
return;
|
|
|
|
// If this is the holding variable for a `BindingDecl`, we may already
|
|
// have a storage location set up -- so check. (See also explanation below
|
|
// where we process the `BindingDecl`.)
|
|
if (D.getType()->isReferenceType() && Env.getStorageLocation(D) != nullptr)
|
|
return;
|
|
|
|
assert(Env.getStorageLocation(D) == nullptr);
|
|
|
|
Env.setStorageLocation(D, Env.createObject(D));
|
|
|
|
// `DecompositionDecl` must be handled after we've interpreted the loc
|
|
// itself, because the binding expression refers back to the
|
|
// `DecompositionDecl` (even though it has no written name).
|
|
if (const auto *Decomp = dyn_cast<DecompositionDecl>(&D)) {
|
|
// If VarDecl is a DecompositionDecl, evaluate each of its bindings. This
|
|
// needs to be evaluated after initializing the values in the storage for
|
|
// VarDecl, as the bindings refer to them.
|
|
// FIXME: Add support for ArraySubscriptExpr.
|
|
// FIXME: Consider adding AST nodes used in BindingDecls to the CFG.
|
|
for (const auto *B : Decomp->bindings()) {
|
|
if (auto *ME = dyn_cast_or_null<MemberExpr>(B->getBinding())) {
|
|
auto *DE = dyn_cast_or_null<DeclRefExpr>(ME->getBase());
|
|
if (DE == nullptr)
|
|
continue;
|
|
|
|
// ME and its base haven't been visited because they aren't included
|
|
// in the statements of the CFG basic block.
|
|
VisitDeclRefExpr(DE);
|
|
VisitMemberExpr(ME);
|
|
|
|
if (auto *Loc = Env.getStorageLocation(*ME))
|
|
Env.setStorageLocation(*B, *Loc);
|
|
} else if (auto *VD = B->getHoldingVar()) {
|
|
// Holding vars are used to back the `BindingDecl`s of tuple-like
|
|
// types. The holding var declarations appear after the
|
|
// `DecompositionDecl`, so we have to explicitly process them here
|
|
// to know their storage location. They will be processed a second
|
|
// time when we visit their `VarDecl`s, so we have code that protects
|
|
// against this above.
|
|
ProcessVarDecl(*VD);
|
|
auto *VDLoc = Env.getStorageLocation(*VD);
|
|
assert(VDLoc != nullptr);
|
|
Env.setStorageLocation(*B, *VDLoc);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void VisitImplicitCastExpr(const ImplicitCastExpr *S) {
|
|
const Expr *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
|
|
switch (S->getCastKind()) {
|
|
case CK_IntegralToBoolean: {
|
|
// This cast creates a new, boolean value from the integral value. We
|
|
// model that with a fresh value in the environment, unless it's already a
|
|
// boolean.
|
|
if (auto *SubExprVal =
|
|
dyn_cast_or_null<BoolValue>(Env.getValue(*SubExpr)))
|
|
Env.setValue(*S, *SubExprVal);
|
|
else
|
|
// FIXME: If integer modeling is added, then update this code to create
|
|
// the boolean based on the integer model.
|
|
Env.setValue(*S, Env.makeAtomicBoolValue());
|
|
break;
|
|
}
|
|
|
|
case CK_LValueToRValue: {
|
|
// When an L-value is used as an R-value, it may result in sharing, so we
|
|
// need to unpack any nested `Top`s.
|
|
auto *SubExprVal = maybeUnpackLValueExpr(*SubExpr, Env);
|
|
if (SubExprVal == nullptr)
|
|
break;
|
|
|
|
Env.setValue(*S, *SubExprVal);
|
|
break;
|
|
}
|
|
|
|
case CK_IntegralCast:
|
|
// FIXME: This cast creates a new integral value from the
|
|
// subexpression. But, because we don't model integers, we don't
|
|
// distinguish between this new value and the underlying one. If integer
|
|
// modeling is added, then update this code to create a fresh location and
|
|
// value.
|
|
case CK_UncheckedDerivedToBase:
|
|
case CK_ConstructorConversion:
|
|
case CK_UserDefinedConversion:
|
|
// FIXME: Add tests that excercise CK_UncheckedDerivedToBase,
|
|
// CK_ConstructorConversion, and CK_UserDefinedConversion.
|
|
case CK_NoOp: {
|
|
// FIXME: Consider making `Environment::getStorageLocation` skip noop
|
|
// expressions (this and other similar expressions in the file) instead
|
|
// of assigning them storage locations.
|
|
propagateValueOrStorageLocation(*SubExpr, *S, Env);
|
|
break;
|
|
}
|
|
case CK_NullToPointer: {
|
|
auto &NullPointerVal =
|
|
Env.getOrCreateNullPointerValue(S->getType()->getPointeeType());
|
|
Env.setValue(*S, NullPointerVal);
|
|
break;
|
|
}
|
|
case CK_NullToMemberPointer:
|
|
// FIXME: Implement pointers to members. For now, don't associate a value
|
|
// with this expression.
|
|
break;
|
|
case CK_FunctionToPointerDecay: {
|
|
StorageLocation *PointeeLoc = Env.getStorageLocation(*SubExpr);
|
|
if (PointeeLoc == nullptr)
|
|
break;
|
|
|
|
Env.setValue(*S, Env.create<PointerValue>(*PointeeLoc));
|
|
break;
|
|
}
|
|
case CK_BuiltinFnToFnPtr:
|
|
// Despite its name, the result type of `BuiltinFnToFnPtr` is a function,
|
|
// not a function pointer. In addition, builtin functions can only be
|
|
// called directly; it is not legal to take their address. We therefore
|
|
// don't need to create a value or storage location for them.
|
|
break;
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
void VisitUnaryOperator(const UnaryOperator *S) {
|
|
const Expr *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
|
|
switch (S->getOpcode()) {
|
|
case UO_Deref: {
|
|
const auto *SubExprVal = Env.get<PointerValue>(*SubExpr);
|
|
if (SubExprVal == nullptr)
|
|
break;
|
|
|
|
Env.setStorageLocation(*S, SubExprVal->getPointeeLoc());
|
|
break;
|
|
}
|
|
case UO_AddrOf: {
|
|
// FIXME: Model pointers to members.
|
|
if (S->getType()->isMemberPointerType())
|
|
break;
|
|
|
|
if (StorageLocation *PointeeLoc = Env.getStorageLocation(*SubExpr))
|
|
Env.setValue(*S, Env.create<PointerValue>(*PointeeLoc));
|
|
break;
|
|
}
|
|
case UO_LNot: {
|
|
auto *SubExprVal = dyn_cast_or_null<BoolValue>(Env.getValue(*SubExpr));
|
|
if (SubExprVal == nullptr)
|
|
break;
|
|
|
|
Env.setValue(*S, Env.makeNot(*SubExprVal));
|
|
break;
|
|
}
|
|
default:
|
|
break;
|
|
}
|
|
}
|
|
|
|
void VisitCXXThisExpr(const CXXThisExpr *S) {
|
|
auto *ThisPointeeLoc = Env.getThisPointeeStorageLocation();
|
|
if (ThisPointeeLoc == nullptr)
|
|
// Unions are not supported yet, and will not have a location for the
|
|
// `this` expression's pointee.
|
|
return;
|
|
|
|
Env.setValue(*S, Env.create<PointerValue>(*ThisPointeeLoc));
|
|
}
|
|
|
|
void VisitCXXNewExpr(const CXXNewExpr *S) {
|
|
if (Value *Val = Env.createValue(S->getType()))
|
|
Env.setValue(*S, *Val);
|
|
}
|
|
|
|
void VisitCXXDeleteExpr(const CXXDeleteExpr *S) {
|
|
// Empty method.
|
|
// We consciously don't do anything on deletes. Diagnosing double deletes
|
|
// (for example) should be done by a specific analysis, not by the
|
|
// framework.
|
|
}
|
|
|
|
void VisitReturnStmt(const ReturnStmt *S) {
|
|
if (!Env.getDataflowAnalysisContext().getOptions().ContextSensitiveOpts)
|
|
return;
|
|
|
|
auto *Ret = S->getRetValue();
|
|
if (Ret == nullptr)
|
|
return;
|
|
|
|
if (Ret->isPRValue()) {
|
|
auto *Val = Env.getValue(*Ret);
|
|
if (Val == nullptr)
|
|
return;
|
|
|
|
// FIXME: Model NRVO.
|
|
Env.setReturnValue(Val);
|
|
} else {
|
|
auto *Loc = Env.getStorageLocation(*Ret);
|
|
if (Loc == nullptr)
|
|
return;
|
|
|
|
// FIXME: Model NRVO.
|
|
Env.setReturnStorageLocation(Loc);
|
|
}
|
|
}
|
|
|
|
void VisitMemberExpr(const MemberExpr *S) {
|
|
ValueDecl *Member = S->getMemberDecl();
|
|
assert(Member != nullptr);
|
|
|
|
// FIXME: Consider assigning pointer values to function member expressions.
|
|
if (Member->isFunctionOrFunctionTemplate())
|
|
return;
|
|
|
|
// FIXME: if/when we add support for modeling enums, use that support here.
|
|
if (isa<EnumConstantDecl>(Member))
|
|
return;
|
|
|
|
if (auto *D = dyn_cast<VarDecl>(Member)) {
|
|
if (D->hasGlobalStorage()) {
|
|
auto *VarDeclLoc = Env.getStorageLocation(*D);
|
|
if (VarDeclLoc == nullptr)
|
|
return;
|
|
|
|
Env.setStorageLocation(*S, *VarDeclLoc);
|
|
return;
|
|
}
|
|
}
|
|
|
|
RecordStorageLocation *BaseLoc = getBaseObjectLocation(*S, Env);
|
|
if (BaseLoc == nullptr)
|
|
return;
|
|
|
|
auto *MemberLoc = BaseLoc->getChild(*Member);
|
|
if (MemberLoc == nullptr)
|
|
return;
|
|
Env.setStorageLocation(*S, *MemberLoc);
|
|
}
|
|
|
|
void VisitCXXDefaultInitExpr(const CXXDefaultInitExpr *S) {
|
|
const Expr *InitExpr = S->getExpr();
|
|
assert(InitExpr != nullptr);
|
|
propagateValueOrStorageLocation(*InitExpr, *S, Env);
|
|
}
|
|
|
|
void VisitCXXConstructExpr(const CXXConstructExpr *S) {
|
|
const CXXConstructorDecl *ConstructorDecl = S->getConstructor();
|
|
assert(ConstructorDecl != nullptr);
|
|
|
|
if (ConstructorDecl->isCopyOrMoveConstructor()) {
|
|
// It is permissible for a copy/move constructor to have additional
|
|
// parameters as long as they have default arguments defined for them.
|
|
assert(S->getNumArgs() != 0);
|
|
|
|
const Expr *Arg = S->getArg(0);
|
|
assert(Arg != nullptr);
|
|
|
|
auto *ArgLoc = Env.get<RecordStorageLocation>(*Arg);
|
|
if (ArgLoc == nullptr)
|
|
return;
|
|
|
|
if (S->isElidable()) {
|
|
if (Value *Val = Env.getValue(*ArgLoc))
|
|
Env.setValue(*S, *Val);
|
|
} else {
|
|
auto &Val = *cast<RecordValue>(Env.createValue(S->getType()));
|
|
Env.setValue(*S, Val);
|
|
copyRecord(*ArgLoc, Val.getLoc(), Env);
|
|
}
|
|
return;
|
|
}
|
|
|
|
// `CXXConstructExpr` can have array type if default-initializing an array
|
|
// of records, and we currently can't create values for arrays. So check if
|
|
// we've got a record type.
|
|
if (S->getType()->isRecordType()) {
|
|
auto &InitialVal = *cast<RecordValue>(Env.createValue(S->getType()));
|
|
Env.setValue(*S, InitialVal);
|
|
}
|
|
|
|
transferInlineCall(S, ConstructorDecl);
|
|
}
|
|
|
|
void VisitCXXOperatorCallExpr(const CXXOperatorCallExpr *S) {
|
|
if (S->getOperator() == OO_Equal) {
|
|
assert(S->getNumArgs() == 2);
|
|
|
|
const Expr *Arg0 = S->getArg(0);
|
|
assert(Arg0 != nullptr);
|
|
|
|
const Expr *Arg1 = S->getArg(1);
|
|
assert(Arg1 != nullptr);
|
|
|
|
// Evaluate only copy and move assignment operators.
|
|
const auto *Method =
|
|
dyn_cast_or_null<CXXMethodDecl>(S->getDirectCallee());
|
|
if (!Method)
|
|
return;
|
|
if (!Method->isCopyAssignmentOperator() &&
|
|
!Method->isMoveAssignmentOperator())
|
|
return;
|
|
|
|
RecordStorageLocation *LocSrc = nullptr;
|
|
if (Arg1->isPRValue()) {
|
|
if (auto *Val = Env.get<RecordValue>(*Arg1))
|
|
LocSrc = &Val->getLoc();
|
|
} else {
|
|
LocSrc = Env.get<RecordStorageLocation>(*Arg1);
|
|
}
|
|
auto *LocDst = Env.get<RecordStorageLocation>(*Arg0);
|
|
|
|
if (LocSrc == nullptr || LocDst == nullptr)
|
|
return;
|
|
|
|
// The assignment operators are different from the type of the destination
|
|
// in this model (i.e. in one of their base classes). This must be very
|
|
// rare and we just bail.
|
|
if (Method->getFunctionObjectParameterType()
|
|
.getCanonicalType()
|
|
.getUnqualifiedType() !=
|
|
LocDst->getType().getCanonicalType().getUnqualifiedType())
|
|
return;
|
|
|
|
copyRecord(*LocSrc, *LocDst, Env);
|
|
|
|
// If the expr is a glvalue, we can reasonably assume the operator is
|
|
// returning T& and thus we can assign it `LocDst`.
|
|
if (S->isGLValue()) {
|
|
Env.setStorageLocation(*S, *LocDst);
|
|
} else if (S->getType()->isRecordType()) {
|
|
// Make sure that we have a `RecordValue` for this expression so that
|
|
// `Environment::getResultObjectLocation()` is able to return a location
|
|
// for it.
|
|
if (Env.getValue(*S) == nullptr)
|
|
refreshRecordValue(*S, Env);
|
|
}
|
|
|
|
return;
|
|
}
|
|
|
|
// CXXOperatorCallExpr can be prvalues. Call `VisitCallExpr`() to create
|
|
// a `RecordValue` for them so that `Environment::getResultObjectLocation()`
|
|
// can return a value.
|
|
VisitCallExpr(S);
|
|
}
|
|
|
|
void VisitCXXRewrittenBinaryOperator(const CXXRewrittenBinaryOperator *RBO) {
|
|
propagateValue(*RBO->getSemanticForm(), *RBO, Env);
|
|
}
|
|
|
|
void VisitCXXFunctionalCastExpr(const CXXFunctionalCastExpr *S) {
|
|
if (S->getCastKind() == CK_ConstructorConversion) {
|
|
const Expr *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
|
|
propagateValue(*SubExpr, *S, Env);
|
|
}
|
|
}
|
|
|
|
void VisitCXXTemporaryObjectExpr(const CXXTemporaryObjectExpr *S) {
|
|
if (Value *Val = Env.createValue(S->getType()))
|
|
Env.setValue(*S, *Val);
|
|
}
|
|
|
|
void VisitCallExpr(const CallExpr *S) {
|
|
// Of clang's builtins, only `__builtin_expect` is handled explicitly, since
|
|
// others (like trap, debugtrap, and unreachable) are handled by CFG
|
|
// construction.
|
|
if (S->isCallToStdMove()) {
|
|
assert(S->getNumArgs() == 1);
|
|
|
|
const Expr *Arg = S->getArg(0);
|
|
assert(Arg != nullptr);
|
|
|
|
auto *ArgLoc = Env.getStorageLocation(*Arg);
|
|
if (ArgLoc == nullptr)
|
|
return;
|
|
|
|
Env.setStorageLocation(*S, *ArgLoc);
|
|
} else if (S->getDirectCallee() != nullptr &&
|
|
S->getDirectCallee()->getBuiltinID() ==
|
|
Builtin::BI__builtin_expect) {
|
|
assert(S->getNumArgs() > 0);
|
|
assert(S->getArg(0) != nullptr);
|
|
auto *ArgVal = Env.getValue(*S->getArg(0));
|
|
if (ArgVal == nullptr)
|
|
return;
|
|
Env.setValue(*S, *ArgVal);
|
|
} else if (const FunctionDecl *F = S->getDirectCallee()) {
|
|
transferInlineCall(S, F);
|
|
|
|
// If this call produces a prvalue of record type, make sure that we have
|
|
// a `RecordValue` for it. This is required so that
|
|
// `Environment::getResultObjectLocation()` is able to return a location
|
|
// for this `CallExpr`.
|
|
if (S->getType()->isRecordType() && S->isPRValue())
|
|
if (Env.getValue(*S) == nullptr)
|
|
refreshRecordValue(*S, Env);
|
|
}
|
|
}
|
|
|
|
void VisitMaterializeTemporaryExpr(const MaterializeTemporaryExpr *S) {
|
|
const Expr *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
|
|
Value *SubExprVal = Env.getValue(*SubExpr);
|
|
if (SubExprVal == nullptr)
|
|
return;
|
|
|
|
if (RecordValue *RecordVal = dyn_cast<RecordValue>(SubExprVal)) {
|
|
Env.setStorageLocation(*S, RecordVal->getLoc());
|
|
return;
|
|
}
|
|
|
|
StorageLocation &Loc = Env.createStorageLocation(*S);
|
|
Env.setValue(Loc, *SubExprVal);
|
|
Env.setStorageLocation(*S, Loc);
|
|
}
|
|
|
|
void VisitCXXBindTemporaryExpr(const CXXBindTemporaryExpr *S) {
|
|
const Expr *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
|
|
propagateValue(*SubExpr, *S, Env);
|
|
}
|
|
|
|
void VisitCXXStaticCastExpr(const CXXStaticCastExpr *S) {
|
|
if (S->getCastKind() == CK_NoOp) {
|
|
const Expr *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
|
|
propagateValueOrStorageLocation(*SubExpr, *S, Env);
|
|
}
|
|
}
|
|
|
|
void VisitConditionalOperator(const ConditionalOperator *S) {
|
|
// FIXME: Revisit this once flow conditions are added to the framework. For
|
|
// `a = b ? c : d` we can add `b => a == c && !b => a == d` to the flow
|
|
// condition.
|
|
// When we do this, we will need to retrieve the values of the operands from
|
|
// the environments for the basic blocks they are computed in, in a similar
|
|
// way to how this is done for short-circuited logical operators in
|
|
// `getLogicOperatorSubExprValue()`.
|
|
if (S->isGLValue())
|
|
Env.setStorageLocation(*S, Env.createObject(S->getType()));
|
|
else if (Value *Val = Env.createValue(S->getType()))
|
|
Env.setValue(*S, *Val);
|
|
}
|
|
|
|
void VisitInitListExpr(const InitListExpr *S) {
|
|
QualType Type = S->getType();
|
|
|
|
if (!Type->isStructureOrClassType()) {
|
|
if (auto *Val = Env.createValue(Type))
|
|
Env.setValue(*S, *Val);
|
|
|
|
return;
|
|
}
|
|
|
|
// In case the initializer list is transparent, we just need to propagate
|
|
// the value that it contains.
|
|
if (S->isSemanticForm() && S->isTransparent()) {
|
|
propagateValue(*S->getInit(0), *S, Env);
|
|
return;
|
|
}
|
|
|
|
llvm::DenseMap<const ValueDecl *, StorageLocation *> FieldLocs;
|
|
|
|
// This only contains the direct fields for the given type.
|
|
std::vector<FieldDecl *> FieldsForInit =
|
|
getFieldsForInitListExpr(Type->getAsRecordDecl());
|
|
|
|
// `S->inits()` contains all the initializer epressions, including the
|
|
// ones for direct base classes.
|
|
auto Inits = S->inits();
|
|
size_t InitIdx = 0;
|
|
|
|
// Initialize base classes.
|
|
if (auto* R = S->getType()->getAsCXXRecordDecl()) {
|
|
assert(FieldsForInit.size() + R->getNumBases() == Inits.size());
|
|
for ([[maybe_unused]] const CXXBaseSpecifier &Base : R->bases()) {
|
|
assert(InitIdx < Inits.size());
|
|
auto Init = Inits[InitIdx++];
|
|
assert(Base.getType().getCanonicalType() ==
|
|
Init->getType().getCanonicalType());
|
|
auto *BaseVal = Env.get<RecordValue>(*Init);
|
|
if (!BaseVal)
|
|
BaseVal = cast<RecordValue>(Env.createValue(Init->getType()));
|
|
// Take ownership of the fields of the `RecordValue` for the base class
|
|
// and incorporate them into the "flattened" set of fields for the
|
|
// derived class.
|
|
auto Children = BaseVal->getLoc().children();
|
|
FieldLocs.insert(Children.begin(), Children.end());
|
|
}
|
|
}
|
|
|
|
assert(FieldsForInit.size() == Inits.size() - InitIdx);
|
|
for (auto Field : FieldsForInit) {
|
|
assert(InitIdx < Inits.size());
|
|
auto Init = Inits[InitIdx++];
|
|
assert(
|
|
// The types are same, or
|
|
Field->getType().getCanonicalType().getUnqualifiedType() ==
|
|
Init->getType().getCanonicalType().getUnqualifiedType() ||
|
|
// The field's type is T&, and initializer is T
|
|
(Field->getType()->isReferenceType() &&
|
|
Field->getType().getCanonicalType()->getPointeeType() ==
|
|
Init->getType().getCanonicalType()));
|
|
auto& Loc = Env.createObject(Field->getType(), Init);
|
|
FieldLocs.insert({Field, &Loc});
|
|
}
|
|
|
|
// Check that we satisfy the invariant that a `RecordStorageLoation`
|
|
// contains exactly the set of modeled fields for that type.
|
|
// `ModeledFields` includes fields from all the bases, but only the
|
|
// modeled ones. However, if a class type is initialized with an
|
|
// `InitListExpr`, all fields in the class, including those from base
|
|
// classes, are included in the set of modeled fields. The code above
|
|
// should therefore populate exactly the modeled fields.
|
|
assert(containsSameFields(
|
|
Env.getDataflowAnalysisContext().getModeledFields(Type), FieldLocs));
|
|
|
|
RecordStorageLocation::SyntheticFieldMap SyntheticFieldLocs;
|
|
for (const auto &Entry :
|
|
Env.getDataflowAnalysisContext().getSyntheticFields(Type)) {
|
|
SyntheticFieldLocs.insert(
|
|
{Entry.getKey(), &Env.createObject(Entry.getValue())});
|
|
}
|
|
|
|
auto &Loc = Env.getDataflowAnalysisContext().createRecordStorageLocation(
|
|
Type, std::move(FieldLocs), std::move(SyntheticFieldLocs));
|
|
RecordValue &RecordVal = Env.create<RecordValue>(Loc);
|
|
|
|
Env.setValue(Loc, RecordVal);
|
|
|
|
Env.setValue(*S, RecordVal);
|
|
|
|
// FIXME: Implement array initialization.
|
|
}
|
|
|
|
void VisitCXXBoolLiteralExpr(const CXXBoolLiteralExpr *S) {
|
|
Env.setValue(*S, Env.getBoolLiteralValue(S->getValue()));
|
|
}
|
|
|
|
void VisitIntegerLiteral(const IntegerLiteral *S) {
|
|
Env.setValue(*S, Env.getIntLiteralValue(S->getValue()));
|
|
}
|
|
|
|
void VisitParenExpr(const ParenExpr *S) {
|
|
// The CFG does not contain `ParenExpr` as top-level statements in basic
|
|
// blocks, however manual traversal to sub-expressions may encounter them.
|
|
// Redirect to the sub-expression.
|
|
auto *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
Visit(SubExpr);
|
|
}
|
|
|
|
void VisitExprWithCleanups(const ExprWithCleanups *S) {
|
|
// The CFG does not contain `ExprWithCleanups` as top-level statements in
|
|
// basic blocks, however manual traversal to sub-expressions may encounter
|
|
// them. Redirect to the sub-expression.
|
|
auto *SubExpr = S->getSubExpr();
|
|
assert(SubExpr != nullptr);
|
|
Visit(SubExpr);
|
|
}
|
|
|
|
private:
|
|
/// Returns the value for the sub-expression `SubExpr` of a logic operator.
|
|
BoolValue &getLogicOperatorSubExprValue(const Expr &SubExpr) {
|
|
// `SubExpr` and its parent logic operator might be part of different basic
|
|
// blocks. We try to access the value that is assigned to `SubExpr` in the
|
|
// corresponding environment.
|
|
if (const Environment *SubExprEnv = StmtToEnv.getEnvironment(SubExpr))
|
|
if (auto *Val =
|
|
dyn_cast_or_null<BoolValue>(SubExprEnv->getValue(SubExpr)))
|
|
return *Val;
|
|
|
|
// The sub-expression may lie within a basic block that isn't reachable,
|
|
// even if we need it to evaluate the current (reachable) expression
|
|
// (see https://discourse.llvm.org/t/70775). In this case, visit `SubExpr`
|
|
// within the current environment and then try to get the value that gets
|
|
// assigned to it.
|
|
if (Env.getValue(SubExpr) == nullptr)
|
|
Visit(&SubExpr);
|
|
if (auto *Val = dyn_cast_or_null<BoolValue>(Env.getValue(SubExpr)))
|
|
return *Val;
|
|
|
|
// If the value of `SubExpr` is still unknown, we create a fresh symbolic
|
|
// boolean value for it.
|
|
return Env.makeAtomicBoolValue();
|
|
}
|
|
|
|
// If context sensitivity is enabled, try to analyze the body of the callee
|
|
// `F` of `S`. The type `E` must be either `CallExpr` or `CXXConstructExpr`.
|
|
template <typename E>
|
|
void transferInlineCall(const E *S, const FunctionDecl *F) {
|
|
const auto &Options = Env.getDataflowAnalysisContext().getOptions();
|
|
if (!(Options.ContextSensitiveOpts &&
|
|
Env.canDescend(Options.ContextSensitiveOpts->Depth, F)))
|
|
return;
|
|
|
|
const ControlFlowContext *CFCtx =
|
|
Env.getDataflowAnalysisContext().getControlFlowContext(F);
|
|
if (!CFCtx)
|
|
return;
|
|
|
|
// FIXME: We don't support context-sensitive analysis of recursion, so
|
|
// we should return early here if `F` is the same as the `FunctionDecl`
|
|
// holding `S` itself.
|
|
|
|
auto ExitBlock = CFCtx->getCFG().getExit().getBlockID();
|
|
|
|
auto CalleeEnv = Env.pushCall(S);
|
|
|
|
// FIXME: Use the same analysis as the caller for the callee. Note,
|
|
// though, that doing so would require support for changing the analysis's
|
|
// ASTContext.
|
|
auto Analysis = NoopAnalysis(CFCtx->getDecl().getASTContext(),
|
|
DataflowAnalysisOptions{Options});
|
|
|
|
auto BlockToOutputState =
|
|
dataflow::runDataflowAnalysis(*CFCtx, Analysis, CalleeEnv);
|
|
assert(BlockToOutputState);
|
|
assert(ExitBlock < BlockToOutputState->size());
|
|
|
|
auto &ExitState = (*BlockToOutputState)[ExitBlock];
|
|
assert(ExitState);
|
|
|
|
Env.popCall(S, ExitState->Env);
|
|
}
|
|
|
|
const StmtToEnvMap &StmtToEnv;
|
|
Environment &Env;
|
|
};
|
|
|
|
} // namespace
|
|
|
|
void transfer(const StmtToEnvMap &StmtToEnv, const Stmt &S, Environment &Env) {
|
|
TransferVisitor(StmtToEnv, Env).Visit(&S);
|
|
}
|
|
|
|
} // namespace dataflow
|
|
} // namespace clang
|