|
| 1 | +module ChainRulesModule |
| 2 | + |
| 3 | +using ChainRulesCore: |
| 4 | + ChainRulesCore, AbstractTangent, NoTangent, ZeroTangent, Tangent, @thunk, canonicalize |
| 5 | +using ..OperatorEnumModule: OperatorEnum |
| 6 | +using ..EquationModule: AbstractExpressionNode, with_type_parameters, tree_mapreduce |
| 7 | +using ..EvaluateEquationModule: eval_tree_array |
| 8 | +using ..EvaluateEquationDerivativeModule: eval_grad_tree_array |
| 9 | + |
"""
    NodeTangent{T,N<:AbstractExpressionNode{T},A<:AbstractArray{T}} <: AbstractTangent

Tangent type that pairs an expression `tree` with a `gradient` array whose
element type `T` matches the element type parameter of the tree.

# Fields
- `tree::N`: the expression node this tangent belongs to.
- `gradient::A`: the gradient values associated with `tree`.
  NOTE(review): presumably one entry per differentiable constant of `tree` —
  confirm against the code that constructs this type.
"""
struct NodeTangent{T,N<:AbstractExpressionNode{T},A<:AbstractArray{T}} <: AbstractTangent
    tree::N
    gradient::A
end
"""
    +(a::NodeTangent, b::NodeTangent)

Add two tangents by adding their `gradient` arrays. Both operands are asserted
to refer to equal trees; the result carries the tree of `a`.
"""
function Base.:+(a::NodeTangent, b::NodeTangent)
    # Internal invariant: tangents of different trees must never be combined.
    @assert a.tree == b.tree
    summed = a.gradient + b.gradient
    return NodeTangent(a.tree, summed)
end
# Scaling a `NodeTangent` by a number scales its `gradient` and keeps its tree.
# The operand order of the original product is preserved in each method.
function Base.:*(a::Number, b::NodeTangent)
    scaled = a * b.gradient
    return NodeTangent(b.tree, scaled)
end
function Base.:*(a::NodeTangent, b::Number)
    scaled = a.gradient * b
    return NodeTangent(a.tree, scaled)
end
"""
    zero(::NodeTangent)
    zero(::Type{<:NodeTangent})

Return `ZeroTangent()` as the additive identity for `NodeTangent`.

The type form is declared with `Type{<:NodeTangent}` so that it also applies to
concrete parameterisations such as `typeof(t)` for a tangent `t`;
`Type{NodeTangent}` alone matches only the unparameterised name.
"""
Base.zero(::Union{Type{<:NodeTangent},NodeTangent}) = ZeroTangent()
| 21 | + |
# Evaluate the gradient of `tree` over `X` with `eval_grad_tree_array`, forwarding
# `variable` unchanged, and overwrite the gradient with NaN when the evaluation
# reports that it did not complete.
# Kept as a separate function so its locals live in their own scope and can never
# alias (and thereby box) a local variable of the calling `rrule`.
function _gradient_or_nan(tree, X, operators, variable::Val)
    _, gradient, grad_complete = eval_grad_tree_array(
        tree, X, operators; variable=variable
    )
    if !grad_complete
        gradient .= NaN
    end
    return gradient
end

"""
    ChainRulesCore.rrule(
        ::typeof(eval_tree_array), tree, X, operators;
        turbo=Val(false), bumper=Val(false),
    )

Reverse-mode rule for `eval_tree_array`.

# Keywords
- `turbo`, `bumper`: forwarded unchanged to `eval_tree_array`.

# Returns
`((primal, complete), pullback)`, where `primal` and `complete` are the outputs of
`eval_tree_array`. When `complete` is `false`, `primal` is overwritten with NaN.

`pullback` takes the cotangent of `(primal, complete)`; the cotangent of `complete`
is ignored. It returns `(NoTangent(), dtree, dX, NoTangent())`, both lazy thunks:
- `dtree` is a `NodeTangent` for `tree`, built from the gradient obtained with
  `variable=Val(false)`, whose columns are weighted by the output cotangent and summed.
- `dX` is the gradient obtained with `variable=Val(true)`, scaled column-wise by
  the output cotangent.

In both cases the gradient is replaced by NaN when its evaluation did not complete.
"""
function ChainRulesCore.rrule(
    ::typeof(eval_tree_array),
    tree::AbstractExpressionNode,
    X::AbstractMatrix,
    operators::OperatorEnum;
    turbo=Val(false),
    bumper=Val(false),
)
    primal, complete = eval_tree_array(tree, X, operators; turbo, bumper)

    if !complete
        primal .= NaN
    end

    # TODO: Preferable to use the primal in the pullback somehow
    function pullback((dY_in, _))
        # The incoming cotangent may be lazy; `unthunk` is the identity otherwise.
        dY = ChainRulesCore.unthunk(dY_in)
        dtree = let dY = dY, tree = tree, X = X, operators = operators
            @thunk(
                let
                    tree_grad = _gradient_or_nan(tree, X, operators, Val(false))
                    # Weight every gradient column by its output cotangent and
                    # accumulate; views avoid copying each column first.
                    NodeTangent(
                        tree,
                        sum(
                            j -> view(tree_grad, :, j) * dY[j],
                            eachindex(dY, axes(tree_grad, 2)),
                        ),
                    )
                end
            )
        end
        dX = let dY = dY, tree = tree, X = X, operators = operators
            @thunk(
                let
                    input_grad = _gradient_or_nan(tree, X, operators, Val(true))
                    # Broadcast the cotangent as a row so column j is scaled by dY[j].
                    input_grad .* reshape(dY, 1, length(dY))
                end
            )
        end
        return (NoTangent(), dtree, dX, NoTangent())
    end

    return (primal, complete), pullback
end
| 74 | + |
| 75 | +end |
0 commit comments