From 514ac7c44d1f579240fd97cace4e2471913aaa70 Mon Sep 17 00:00:00 2001 From: Parth Date: Sun, 10 Apr 2022 21:45:09 +0530 Subject: [PATCH] add support for operator overload in reverse mode --- .../ReverseModeForwPassVisitor.cpp | 4 +- lib/Differentiator/ReverseModeVisitor.cpp | 101 ++++++++++++------ test/Gradient/MemberFunctions.C | 51 ++++++++- 3 files changed, 117 insertions(+), 39 deletions(-) diff --git a/lib/Differentiator/ReverseModeForwPassVisitor.cpp b/lib/Differentiator/ReverseModeForwPassVisitor.cpp index c22f4fadf..5b4f41f6c 100644 --- a/lib/Differentiator/ReverseModeForwPassVisitor.cpp +++ b/lib/Differentiator/ReverseModeForwPassVisitor.cpp @@ -29,7 +29,7 @@ ReverseModeForwPassVisitor::Derive(const FunctionDecl* FD, DiffParams args{}; std::copy(FD->param_begin(), FD->param_end(), std::back_inserter(args)); - auto fnName = m_Function->getNameAsString() + "_forw"; + auto fnName = clad::utils::ComputeEffectiveFnName(m_Function) + "_forw"; auto fnDNI = utils::BuildDeclarationNameInfo(m_Sema, fnName); auto paramTypes = ComputeParamTypes(args); @@ -86,8 +86,6 @@ ReverseModeForwPassVisitor::Derive(const FunctionDecl* FD, QualType ReverseModeForwPassVisitor::GetParameterDerivativeType(QualType yType, QualType xType) { - assert(yType.getNonReferenceType()->isRealType() && - "yType should be a builtin-numerical scalar type!!"); QualType xValueType = utils::GetValueType(xType); // derivative variables should always be of non-const type. xValueType.removeLocalConst(); diff --git a/lib/Differentiator/ReverseModeVisitor.cpp b/lib/Differentiator/ReverseModeVisitor.cpp index 9e00797f2..c2b5a9b69 100644 --- a/lib/Differentiator/ReverseModeVisitor.cpp +++ b/lib/Differentiator/ReverseModeVisitor.cpp @@ -1371,7 +1371,8 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, // If the function has no args and is not a member function call then we // assume that it is not related to independent variables and does not // contribute to gradient. - if (!NArgs && !isa(CE)) + if ((NArgs == 0U) && !isa(CE) && + !isa(CE)) return StmtDiff(Clone(CE)); // Stores the call arguments for the function to be derived @@ -1391,7 +1392,7 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, // derived function. In the case of member functions, `implicit` // this object is always passed by reference. if (!dfdx() && !utils::HasAnyReferenceOrPointerArgument(FD) && - !isa(CE)) { + !isa(CE) && !isa(CE)) { for (const Expr* Arg : CE->arguments()) { StmtDiff ArgDiff = Visit(Arg, dfdx()); CallArgs.push_back(ArgDiff.getExpr()); @@ -1415,9 +1416,14 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, // FIXME: We should add instructions for handling non-differentiable // arguments. Currently we are implicitly assuming function call only // contains differentiable arguments. - for (std::size_t i = 0, e = CE->getNumArgs(); i != e; ++i) { + bool isCXXOperatorCall = isa(CE); + + for (std::size_t i = static_cast(isCXXOperatorCall), + e = CE->getNumArgs(); + i != e; ++i) { const Expr* arg = CE->getArg(i); - auto PVD = FD->getParamDecl(i); + const auto* PVD = + FD->getParamDecl(i - static_cast(isCXXOperatorCall)); StmtDiff argDiff{}; bool passByRef = utils::IsReferenceOrPointerType(PVD->getType()); // We do not need to create result arg for arguments passed by reference @@ -1599,25 +1605,28 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, /// `CE` is a call to an instance member function. if (auto MCE = dyn_cast(CE)) { baseDiff = Visit(MCE->getImplicitObjectArgument()); - StmtDiff baseDiffStore = GlobalStoreAndRef(baseDiff.getExpr()); - if (isInsideLoop) { - addToCurrentBlock(baseDiffStore.getExpr()); - VarDecl* baseLocalVD = BuildVarDecl( - baseDiffStore.getExpr_dx()->getType(), - CreateUniqueIdentifier("_r"), baseDiffStore.getExpr_dx(), - /*DirectInit=*/false, /*TSI=*/nullptr, - VarDecl::InitializationStyle::CInit); - auto& block = getCurrentBlock(direction::reverse); - block.insert(block.begin() + insertionPoint, - BuildDeclStmt(baseLocalVD)); - insertionPoint += 1; - Expr* baseLocalE = BuildDeclRef(baseLocalVD); - baseDiffStore = {baseDiffStore.getExpr(), baseLocalE}; + else if (const auto* OCE = dyn_cast(CE)) baseDiff = + Visit(OCE->getArg(0)); + if (baseDiff.getExpr()) { + StmtDiff baseDiffStore = GlobalStoreAndRef(baseDiff.getExpr()); + if (isInsideLoop) { + addToCurrentBlock(baseDiffStore.getExpr()); + VarDecl* baseLocalVD = BuildVarDecl( + baseDiffStore.getExpr_dx()->getType(), + CreateUniqueIdentifier("_r"), baseDiffStore.getExpr_dx(), + /*DirectInit=*/false, /*TSI=*/nullptr, + VarDecl::InitializationStyle::CInit); + auto& block = getCurrentBlock(direction::reverse); + block.insert(block.begin() + insertionPoint, + BuildDeclStmt(baseLocalVD)); + insertionPoint += 1; + Expr* baseLocalE = BuildDeclRef(baseLocalVD); + baseDiffStore = {baseDiffStore.getExpr(), baseLocalE}; + } + baseDiff = {baseDiffStore.getExpr_dx(), baseDiff.getExpr_dx()}; + DerivedCallOutputArgs.push_back( + BuildOp(UnaryOperatorKind::UO_AddrOf, baseDiff.getExpr_dx())); } - baseDiff = {baseDiffStore.getExpr_dx(), baseDiff.getExpr_dx()}; - DerivedCallOutputArgs.push_back( - BuildOp(UnaryOperatorKind::UO_AddrOf, baseDiff.getExpr_dx())); - } for (auto argDerivative : CallArgDx) { gradVarDecl = nullptr; @@ -1689,15 +1698,24 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, pullbackCallArgs = DerivedCallArgs; if (pullback) - pullbackCallArgs.insert(pullbackCallArgs.begin() + CE->getNumArgs(), + pullbackCallArgs.insert(pullbackCallArgs.begin() + CE->getNumArgs() - + static_cast(isCXXOperatorCall), pullback); // Try to find it in builtin derivatives - std::string customPullback = FD->getNameAsString() + "_pullback"; + if (baseDiff.getExpr()) { + pullbackCallArgs.insert( + pullbackCallArgs.begin(), + BuildOp(UnaryOperatorKind::UO_AddrOf, baseDiff.getExpr())); + } + std::string customPullback = + clad::utils::ComputeEffectiveFnName(FD) + "_pullback"; OverloadedDerivedFn = m_Builder.BuildCallToCustomDerivativeOrNumericalDiff( customPullback, pullbackCallArgs, getCurrentScope(), const_cast(FD->getDeclContext())); + if (baseDiff.getExpr()) + pullbackCallArgs.erase(pullbackCallArgs.begin()); } // should be true if we are using numerical differentiation to differentiate @@ -1728,7 +1746,8 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, // derive the called function. DiffRequest pullbackRequest{}; pullbackRequest.Function = FD; - pullbackRequest.BaseFunctionName = FD->getNameAsString(); + pullbackRequest.BaseFunctionName = + clad::utils::ComputeEffectiveFnName(FD); pullbackRequest.Mode = DiffMode::experimental_pullback; // Silence diag outputs in nested derivation process. pullbackRequest.VerboseDiags = false; @@ -1775,7 +1794,7 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, usingNumericalDiff = true; } } else if (pullbackFD) { - if (isa(CE)) { + if (baseDiff.getExpr()) { Expr* baseE = baseDiff.getExpr(); OverloadedDerivedFn = BuildCallExprToMemFn( baseE, pullbackFD->getName(), pullbackCallArgs, pullbackFD); @@ -1861,7 +1880,8 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, DiffRequest calleeFnForwPassReq; calleeFnForwPassReq.Function = FD; calleeFnForwPassReq.Mode = DiffMode::reverse_mode_forward_pass; - calleeFnForwPassReq.BaseFunctionName = FD->getNameAsString(); + calleeFnForwPassReq.BaseFunctionName = + clad::utils::ComputeEffectiveFnName(FD); calleeFnForwPassReq.VerboseDiags = true; FunctionDecl* calleeFnForwPassFD = plugin::ProcessDiffRequest(m_CladPlugin, calleeFnForwPassReq); @@ -1878,20 +1898,24 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, // We cannot reuse the derivatives previously computed because // they might contain 'clad::pop(..)` expression. - if (isa(CE)) { + if (isa(CE) || isa(CE)) { Expr* derivedBase = baseDiff.getExpr_dx(); // FIXME: We may need this if-block once we support pointers, and // passing pointers-by-reference if // (isCladArrayType(derivedBase->getType())) // CallArgs.push_back(derivedBase); // else + // Currently derivedBase `*d_this` can never be CladArrayType CallArgs.push_back( BuildOp(UnaryOperatorKind::UO_AddrOf, derivedBase, noLoc)); } - for (std::size_t i = 0, e = CE->getNumArgs(); i != e; ++i) { + for (std::size_t i = static_cast(isCXXOperatorCall), + e = CE->getNumArgs(); + i != e; ++i) { const Expr* arg = CE->getArg(i); - const ParmVarDecl* PVD = FD->getParamDecl(i); + const ParmVarDecl* PVD = + FD->getParamDecl(i - static_cast(isCXXOperatorCall)); StmtDiff argDiff = Visit(arg); if ((argDiff.getExpr_dx() != nullptr) && PVD->getType()->isReferenceType()) { @@ -1906,7 +1930,7 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, } else CallArgs.push_back(m_Sema.ActOnCXXNullPtrLiteral(noLoc).get()); } - if (isa(CE)) { + if (isa(CE) || isa(CE)) { Expr* baseE = baseDiff.getExpr(); call = BuildCallExprToMemFn(baseE, calleeFnForwPassFD->getName(), CallArgs, calleeFnForwPassFD); @@ -1993,6 +2017,18 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, } } } + + if (opCode == UnaryOperatorKind::UO_Deref && + m_Mode == DiffMode::reverse_mode_forward_pass) { + if (const auto* MD = dyn_cast(m_Function)) { + if (MD->isInstance()) { + diff = Visit(UnOp->getSubExpr()); + Expr* cloneE = BuildOp(UnaryOperatorKind::UO_Deref, diff.getExpr()); + Expr* derivedE = diff.getExpr_dx(); + return {cloneE, derivedE}; + } + } + } // We should not output any warning on visiting boolean conditions // FIXME: We should support boolean differentiation or ignore it // completely @@ -3154,9 +3190,6 @@ Expr* getArraySizeExpr(const ArrayType* AT, ASTContext& context, if (m_Mode == DiffMode::reverse) assert(yType->isRealType() && "yType should be a non-reference builtin-numerical scalar type!!"); - else if (m_Mode == DiffMode::experimental_pullback) - assert(yType.getNonReferenceType()->isRealType() && - "yType should be a builtin-numerical scalar type!!"); QualType xValueType = utils::GetValueType(xType); // derivative variables should always be of non-const type. xValueType.removeLocalConst(); diff --git a/test/Gradient/MemberFunctions.C b/test/Gradient/MemberFunctions.C index a6ffeac36..3523b77ac 100644 --- a/test/Gradient/MemberFunctions.C +++ b/test/Gradient/MemberFunctions.C @@ -704,6 +704,10 @@ public: // CHECK-NEXT: } double& ref_mem_fn(double i) {return x;} + SimpleFunctions& operator+=(double value) { + x += value; + return *this; + } void mem_fn_grad(double i, double j, clad::array_ref _d_i, clad::array_ref _d_j); void const_mem_fn_grad(double i, double j, clad::array_ref _d_i, clad::array_ref _d_j); @@ -783,6 +787,44 @@ double fn2(SimpleFunctions& sf, double i) { // CHECK-NEXT: _t1.ref_mem_fn_pullback(_t0, 1, &(* _d_sf), &_grad0); // CHECK-NEXT: double _r0 = _grad0; // CHECK-NEXT: * _d_i += _r0; + +double fn3(SimpleFunctions& v, double value) { + v += value; + return v.x; +} + +// CHECK: void operator_plus_equal_pullback(double value, SimpleFunctions _d_y, clad::array_ref _d_this, clad::array_ref _d_value) { +// CHECK-NEXT: this->x += value; +// CHECK-NEXT: goto _label0; +// CHECK-NEXT: _label0: +// CHECK-NEXT: ; +// CHECK-NEXT: { +// CHECK-NEXT: double _r_d0 = (* _d_this).x; +// CHECK-NEXT: (* _d_this).x += _r_d0; +// CHECK-NEXT: * _d_value += _r_d0; +// CHECK-NEXT: (* _d_this).x -= _r_d0; +// CHECK-NEXT: } +// CHECK-NEXT: } + +// CHECK: clad::ValueAndAdjoint operator_plus_equal_forw(double value, clad::array_ref _d_this, clad::array_ref _d_value) { +// CHECK-NEXT: this->x += value; +// CHECK-NEXT: return {*this, (* _d_this)}; +// CHECK-NEXT: } + +// CHECK: void fn3_grad(SimpleFunctions &v, double value, clad::array_ref _d_v, clad::array_ref _d_value) { +// CHECK-NEXT: double _t0; +// CHECK-NEXT: SimpleFunctions _t1; +// CHECK-NEXT: _t0 = value; +// CHECK-NEXT: _t1 = v; +// CHECK-NEXT: clad::ValueAndAdjoint _t2 = _t1.operator_plus_equal_forw(_t0, &(* _d_v), nullptr); +// CHECK-NEXT: goto _label0; +// CHECK-NEXT: _label0: +// CHECK-NEXT: (* _d_v).x += 1; +// CHECK-NEXT: { +// CHECK-NEXT: double _grad0 = 0.; +// CHECK-NEXT: _t1.operator_plus_equal_pullback(_t0, {}, &(* _d_v), &_grad0); +// CHECK-NEXT: double _r0 = _grad0; +// CHECK-NEXT: * _d_value += _r0; // CHECK-NEXT: } // CHECK-NEXT: } @@ -821,12 +863,17 @@ int main() { printf("%.2f ",result[i]); //CHECK-EXEC: 40.00 16.00 } - SimpleFunctions sf(2, 3); + SimpleFunctions sf1(2, 3), sf2(3, 4); SimpleFunctions d_sf; + auto d_fn2 = clad::gradient(fn2); - d_fn2.execute(sf, 2, &d_sf, &result[0]); + d_fn2.execute(sf1, 2, &d_sf, &result[0]); printf("%.2f", result[0]); //CHECK-EXEC: 40.00 + auto d_fn3 = clad::gradient(fn3); + d_fn3.execute(sf2, 3, &d_sf, &result[0]); + printf("%.2f", result[0]); //CHECK-EXEC: 42.00 + auto d_const_volatile_lval_ref_mem_fn_i = clad::gradient(&SimpleFunctions::const_volatile_lval_ref_mem_fn, "i"); // CHECK: void const_volatile_lval_ref_mem_fn_grad_0(double i, double j, clad::array_ref _d_this, clad::array_ref _d_i) const volatile & {