d1/dcb/preaccumulationHelper_8hpp_source.html

/*

 * CoDiPack, a Code Differentiation Package

 *

 * Copyright (C) 2015-2024 Chair for Scientific Computing (SciComp), University of Kaiserslautern-Landau

 * Homepage: http://www.scicomp.uni-kl.de

 * Contact:  Prof. Nicolas R. Gauger (codi@scicomp.uni-kl.de)

 *

 * Lead developers: Max Sagebaum, Johannes Blühdorn (SciComp, University of Kaiserslautern-Landau)

 *

 * This file is part of CoDiPack (http://www.scicomp.uni-kl.de/software/codi).

 *

 * CoDiPack is free software: you can redistribute it and/or

 * modify it under the terms of the GNU General Public License

 * as published by the Free Software Foundation, either version 3 of the

 * License, or (at your option) any later version.

 *

 * CoDiPack is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty

 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.

 *

 * See the GNU General Public License for more details.

 * You should have received a copy of the GNU

 * General Public License along with CoDiPack.

 * If not, see <http://www.gnu.org/licenses/>.

 *

 * For other licensing options please contact us.

 *

 * Authors:

 *  - SciComp, University of Kaiserslautern-Landau:

 *    - Max Sagebaum

 *    - Johannes Blühdorn

 *    - Former members:

 *      - Tim Albring

 */


#pragma once


#include <vector>


#include "../../config.h"

#include "../../expressions/lhsExpressionInterface.hpp"

#include "../../misc/exceptions.hpp"

#include "../../tapes/interfaces/fullTapeInterface.hpp"

#include "../../tapes/tagging/tagTapeReverse.hpp"

#include "../../traits/gradientTraits.hpp"

#include "../../traits/tapeTraits.hpp"

#include "../algorithms.hpp"

#include "../data/jacobian.hpp"


namespace codi {


  /**
   * @brief Stores the Jacobian matrix for a code section.
   *
   * The code between start() and finish() is recorded on the tape of T_Type as usual. finish() then computes the
   * Jacobian of the registered outputs with respect to the registered inputs, rewinds the tape to the position taken
   * in start() and pushes, for every output, manual statements that carry the nonzero Jacobian entries.
   *
   * If the tape is not active, only the PreaccStart/PreaccFinish event listeners are notified.
   *
   * Outputs are remembered by address, so they have to stay alive (and must not move) until finish() returns.
   *
   * @tparam T_Type  The CoDiPack type on whose tape the preaccumulation is performed.
   */
  template<typename T_Type, typename = void>
  struct PreaccumulationHelper {
    public:

      /// See PreaccumulationHelper.
      using Type = CODI_DD(T_Type, CODI_DEFAULT_LHS_EXPRESSION);

      using Real = typename Type::Real;              ///< See LhsExpressionInterface.
      using Identifier = typename Type::Identifier;  ///< See LhsExpressionInterface.
      using Gradient = typename Type::Gradient;      ///< See LhsExpressionInterface.

      /// See LhsExpressionInterface.
      using Tape = CODI_DD(typename Type::Tape, CODI_DEFAULT_TAPE);
      using Position = typename Tape::Position;  ///< See PositionalEvaluationTapeInterface.

      /// Identifiers of the registered inputs. Inputs whose identifier equals the passive index are not listed.
      std::vector<Identifier> inputData;

      /// Identifiers of the registered outputs. Outputs whose identifier equals the passive index are not listed.
      std::vector<Identifier> outputData;

      /// Addresses of the registered outputs; entry i belongs to outputData[i].
      std::vector<Type*> outputValues;

    protected:

      Position startPos;                        ///< Starting position for the region.
      std::vector<Gradient> storedAdjoints;     ///< Input adjoints saved by finish() when storeAdjoints is set.
      JacobianCountNonZerosRow<Real> jacobian;  ///< Jacobian for the preaccumulation.

    public:

      /// Constructor. Creates empty input/output lists and a 0x0 Jacobian.
      PreaccumulationHelper()
          : inputData(), outputData(), outputValues(), startPos(), storedAdjoints(), jacobian(0, 0) {}

      /// Add multiple additional inputs. Inputs need to be of type Type. Called after start().
      /// Does nothing if the tape is not active.
      template<typename... Inputs>
      void addInput(Inputs const&... inputs) {
        Tape& tape = Type::getTape();

        if (tape.isActive()) {
          addInputRecursive(inputs...);
        }
      }

      /// Starts a preaccumulation region. Resets the internal state. See addInput() for inputs.
      /// The PreaccStart listeners are notified even if the tape is not active.
      template<typename... Inputs>
      void start(Inputs const&... inputs) {
        Tape& tape = Type::getTape();

        EventSystem<Tape>::notifyPreaccStartListeners(tape);

        if (tape.isActive()) {
          inputData.clear();
          outputData.clear();
          outputValues.clear();

          startPos = tape.getPosition();

          addInputRecursive(inputs...);
        }
      }

      /// Add multiple additional outputs. Outputs need to be of type Type. Called before finish().
      /// Does nothing if the tape is not active.
      template<typename... Outputs>
      void addOutput(Outputs&... outputs) {
        Tape& tape = Type::getTape();

        if (tape.isActive()) {
          addOutputRecursive(outputs...);
        }
      }

      /**
       * @brief Finish the preaccumulation region and perform the preaccumulation. See addOutput() for outputs.
       *
       * @param storeAdjoints  If true, the adjoints of all inputs are saved and reset to Gradient() before the
       *                       preaccumulation and written back afterwards.
       * @param outputs        Additional outputs of the region.
       *
       * The PreaccFinish listeners are notified even if the tape is not active.
       */
      template<typename... Outputs>
      void finish(bool const storeAdjoints, Outputs&... outputs) {
        Tape& tape = Type::getTape();

        if (tape.isActive()) {
          addOutputRecursive(outputs...);

          if (storeAdjoints) {
            storeInputAdjoints();
          }

          // The tape is passive while the Jacobian is computed and pushed.
          tape.setPassive();
          doPreaccumulation();
          tape.setActive();

          if (storeAdjoints) {
            restoreInputAdjoints();
          }
        }

        EventSystem<Tape>::notifyPreaccFinishListeners(tape);
      }

    private:

      /// Notifies the PreaccAddInput listeners and registers the identifier of the input unless it is passive.
      void addInputLogic(Type const& input) {
        EventSystem<Tape>::notifyPreaccAddInputListeners(Type::getTape(), input.getValue(), input.getIdentifier());
        Identifier const& identifier = input.getIdentifier();
        if (Type::getTape().getPassiveIndex() != identifier) {
          inputData.push_back(identifier);
        }
      }

      /// Terminator for the recursive input registration.
      void addInputRecursive() {
        // Terminator implementation.
      }

      /// Registers the first input and recurses on the remaining ones.
      template<typename... Inputs>
      void addInputRecursive(Type const& input, Inputs const&... r) {
        addInputLogic(input);
        addInputRecursive(r...);
      }

      /// Notifies the PreaccAddOutput listeners and registers identifier and address of the output unless it is
      /// passive.
      void addOutputLogic(Type& output) {
        EventSystem<Tape>::notifyPreaccAddOutputListeners(Type::getTape(), output.value(), output.getIdentifier());
        Identifier const& identifier = output.getIdentifier();
        if (Type::getTape().getPassiveIndex() != identifier) {
          outputData.push_back(identifier);
          outputValues.push_back(&output);
        }
      }

      /// Terminator for the recursive output registration.
      void addOutputRecursive() {
        // Terminator implementation.
      }

      /// Registers the first output and recurses on the remaining ones.
      template<typename... Outputs>
      void addOutputRecursive(Type& output, Outputs&... r) {
        addOutputLogic(output);
        addOutputRecursive(r...);
      }

      /// Copies the adjoint of every input into storedAdjoints and resets the adjoint on the tape to Gradient().
      void storeInputAdjoints() {
        Tape& tape = Type::getTape();

        // The buffer only grows; it is reused between preaccumulation regions.
        if (storedAdjoints.size() < inputData.size()) {
          storedAdjoints.resize(inputData.size());
        }

        for (size_t i = 0; i < inputData.size(); ++i) {
          Identifier index = inputData[i];
          Gradient& adjoint = tape.gradient(index);
          storedAdjoints[i] = adjoint;
          adjoint = Gradient();
        }
      }

      /// Writes the adjoints saved by storeInputAdjoints() back to the tape.
      void restoreInputAdjoints() {
        Tape& tape = Type::getTape();

        for (size_t i = 0; i < inputData.size(); ++i) {
          Identifier index = inputData[i];
          tape.gradient(index) = storedAdjoints[i];
        }
      }

      /// Computes the Jacobian of the region [startPos, current position], rewinds the tape to startPos and pushes
      /// the nonzero Jacobian entries of every output as manual statements.
      void doPreaccumulation() {
        Tape& tape = Type::getTape();

        Position endPos = tape.getPosition();
        if (jacobian.getM() != outputData.size() || jacobian.getN() != inputData.size()) {
          jacobian.resize(outputData.size(), inputData.size());
        }

        // Manage adjoints manually to reduce the impact of locking on the performance.
        tape.resizeAdjointVector();
        tape.beginUseAdjointVector();

        // Perform the accumulation of the tape part.
        Algorithms<Type, false>::computeJacobian(startPos, endPos, inputData.data(), inputData.size(),
                                                 outputData.data(), outputData.size(), jacobian,
                                                 AdjointsManagement::Manual);

        // Rewind the tape to the start of the region. The statements pushed below take the place of the recording.
        tape.resetTo(startPos, true, AdjointsManagement::Manual);

        tape.endUseAdjointVector();

        int const maxArguments = static_cast<int>(Config::MaxArgumentSize);

        // Store the Jacobian matrix.
        for (size_t curOut = 0; curOut < outputData.size(); ++curOut) {
          Type& value = *outputValues[curOut];
          if (0 != jacobian.nonZerosRow(curOut)) {
            int nonZerosLeft = jacobian.nonZerosRow(curOut);
            jacobian.nonZerosRow(curOut) = 0;

            // We need to initialize with the output's current identifier such that it is correctly deleted in
            // storeManual.
            Identifier lastIdentifier = value.getIdentifier();
            bool staggeringActive = false;
            int curIn = 0;

            // Push statements as long as there are nonzeros left.
            // If there are more than Config::MaxArgumentSize nonzeros, then we need to stagger the
            // statement pushes. The numbers in the example correspond to a limit of 255 arguments:
            // e.g. The reverse mode of w = f(u0, ..., u530) which is \bar u_i += df/du_i * \bar w for i = 0 ... 530 is
            //      separated into
            //        Statement 1 (creates t_1):
            //          \bar u_i += df/du_i * \bar t_1 for i = 0 ... 253   (254 entries)
            //        Statement 2 (creates t_2):
            //          \bar t_1 += \bar t_2                               (1 entry)
            //          \bar u_i += df/du_i * \bar t_2 for i = 254 ... 506 (253 entries)
            //        Statement 3 (creates w):
            //          \bar t_2 += \bar w                                 (1 entry)
            //          \bar u_i += df/du_i * \bar w for i = 507 ... 530   (24 entries)
            //
            while (nonZerosLeft > 0) {
              // Except in the first round, one argument is reserved for the link to the previous statement.
              int const linkArguments = staggeringActive ? 1 : 0;

              // Calculate the number of Jacobians for this statement. The link argument has to be part of the
              // limit check, otherwise a staggered round with exactly maxArguments nonzeros left would request
              // maxArguments + 1 arguments from storeManual.
              int jacobiansForStatement = nonZerosLeft;
              if (jacobiansForStatement + linkArguments > maxArguments) {
                jacobiansForStatement = maxArguments - 1 - linkArguments;
              }
              nonZerosLeft -= jacobiansForStatement;  // Update nonzeros so that we know if it is the last round.

              Identifier storedIdentifier = lastIdentifier;
              // storeManual creates a new identifier which is either the identifier of the output w or the temporary
              // staggering variables t_1, t_2, ...
              tape.storeManual(value.getValue(), lastIdentifier, jacobiansForStatement + linkArguments);
              if (staggeringActive) {  // Not the first staggering so push the last output.
                tape.pushJacobianManual(1.0, 0.0, storedIdentifier);
              }

              // Push the rest of the Jacobians for the statement. Zero entries are skipped and do not count, so
              // curIn can advance by more than jacobiansForStatement.
              while (jacobiansForStatement > 0) {
                if (Real() != static_cast<Real>(jacobian(curOut, curIn))) {
                  tape.pushJacobianManual(jacobian(curOut, curIn), 0.0, inputData[curIn]);
                  jacobiansForStatement -= 1;
                }
                curIn += 1;
              }

              staggeringActive = true;
            }

            value.getIdentifier() = lastIdentifier; /* now set gradient data for the real output value */
          } else {
            // Disable tape index since there is no dependency.
            tape.destroyIdentifier(value.value(), value.getIdentifier());
          }
        }
      }
  };


#ifndef DOXYGEN_DISABLE

  /// Implementation of the PreaccumulationHelper interface in which every operation accepts its arguments and does
  /// nothing with them.
  struct PreaccumulationHelperNoOpBase {
    public:

      /// No-op counterpart of PreaccumulationHelper::addInput(); the inputs are ignored.
      template<typename... Inputs>
      void addInput(Inputs const&... /* inputs */) {}

      /// No-op counterpart of PreaccumulationHelper::start(); the inputs are ignored.
      template<typename... Inputs>
      void start(Inputs const&... /* inputs */) {}

      /// No-op counterpart of PreaccumulationHelper::addOutput(); the outputs are ignored.
      template<typename... Outputs>
      void addOutput(Outputs&... /* outputs */) {}

      /// No-op counterpart of PreaccumulationHelper::finish(); flag and outputs are ignored.
      template<typename... Outputs>
      void finish(bool const /* storeAdjoints */, Outputs&... /* outputs */) {}
  };


  /// Specialization selected through TapeTraits::EnableIfForwardTape, i.e. for types whose tape is a forward tape.
  /// All operations are inherited from PreaccumulationHelperNoOpBase and do nothing.
  template<typename Type>
  struct PreaccumulationHelper<Type, TapeTraits::EnableIfForwardTape<typename Type::Tape>>
      : PreaccumulationHelperNoOpBase {};


  /// Specialization for plain double. All operations are inherited from PreaccumulationHelperNoOpBase and do nothing.
  template<>
  struct PreaccumulationHelper<double, void> : PreaccumulationHelperNoOpBase {};


  template<typename T_Type>

  struct PreaccumulationHelper<

      T_Type, typename enable_if_same<typename T_Type::Tape,

                                      TagTapeReverse<typename T_Type::Real, typename T_Type::Tape::Tag>>::type> {

    public:


      using Type = CODI_DD(T_Type, CODI_DEFAULT_LHS_EXPRESSION);


      using Tape = CODI_DD(typename Type::Tape, CODI_T(TagTapeReverse<Type, int>));

      using Tag = typename Tape::Tag;


    private:


      std::vector<Type const*> inputLocations;

      std::vector<Type*> outputLocations;

      Tag oldTag;


    public:


      CODI_INLINE PreaccumulationHelper() = default;


      template<typename... Inputs>

      void addInput(Inputs const&... inputs) {

        Tape& tape = getTape();


        if (tape.isActive() && tape.isPreaccumulationHandlingEnabled()) {

          addInputRecursive(inputs...);

        }

      }


      template<typename... Inputs>

      void start(Inputs const&... inputs) {

        Tape& tape = getTape();


        if (tape.isActive() && tape.isPreaccumulationHandlingEnabled()) {

          inputLocations.clear();

          outputLocations.clear();

          oldTag = tape.getCurTag();

          tape.setCurTag(tape.getPreaccumulationHandlingTag());


          addInputRecursive(inputs...);

        }

      }


      template<typename... Outputs>

      void addOutput(Outputs&... outputs) {

        Tape& tape = getTape();


        if (tape.isActive() && tape.isPreaccumulationHandlingEnabled()) {

          addOutputRecursive(outputs...);

        }

      }


      template<typename... Outputs>

      void finish(bool const storeAdjoints, Outputs&... outputs) {

        Tape& tape = getTape();


        if (tape.isActive() && tape.isPreaccumulationHandlingEnabled()) {

          addOutputRecursive(outputs...);


          tape.setCurTag(oldTag);

          for (Type const* curInput : inputLocations) {

            tape.setTagOnVariable(*curInput);

          }

          for (Type* curOutput : outputLocations) {

            tape.setTagOnVariable(*curOutput);

          }

        }

      }


    private:


      void addInputRecursive() {

        // Terminator implementation.

      }


      template<typename... Inputs>

      void addInputRecursive(Type const& input, Inputs const&... r) {

        handleInput(input);

        addInputRecursive(r...);

      }


      void handleInput(Type const& input) {

        inputLocations.push_back(&input);

        getTape().setTagOnVariable(input);

      }


      void addOutputRecursive() {

        // Terminator implementation.

      }


      template<typename... Outputs>

      void addOutputRecursive(Type& output, Outputs&... r) {

        handleOutput(output);

        addOutputRecursive(r...);

      }


      void handleOutput(Type& value) {

        outputLocations.push_back(&value);

      }


      Tape& getTape() {

        return Type::getTape();

      }

  };

#endif

}

CODI_INLINE
#define CODI_INLINE
See codi::Config::ForcedInlines.
Definition: config.h:457

CODI_DD
#define CODI_DD(Type, Default)
Abbreviation for CODI_DECLARE_DEFAULT.
Definition: macros.hpp:94

CODI_T
#define CODI_T(...)
Abbreviation for CODI_TEMPLATE.
Definition: macros.hpp:111

codi::Config::MaxArgumentSize
size_t constexpr MaxArgumentSize
Maximum number of arguments in a statement.
Definition: config.h:120

codi::TapeTraits::EnableIfForwardTape
typename std::enable_if< IsForwardTape< Tape >::value >::type EnableIfForwardTape
Enable if wrapper for IsForwardTape.
Definition: tapeTraits.hpp:88

codi
CoDiPack - Code Differentiation Package.
Definition: codi.hpp:90

codi::CODI_UNUSED
void CODI_UNUSED(Args const &...)
Disable unused warnings for an arbitrary number of arguments.
Definition: macros.hpp:46

codi::enable_if_same
std::enable_if< std::is_same< T1, T2 >::value, R > enable_if_same
Enable if abbreviation for "std::is_same".
Definition: enableIfHelpers.hpp:51

codi::AdjointsManagement::Manual
@ Manual
Do not perform any bounds checking, locking, or resizing.

codi::Algorithms::computeJacobian
static void computeJacobian(Tape &tape, Position const &start, Position const &end, Identifier const *input, size_t const inputSize, Identifier const *output, size_t const outputSize, Jac &jac, AdjointsManagement adjointsManagement=AdjointsManagement::Automatic)
Compute the Jacobian with multiple tape sweeps.
Definition: algorithms.hpp:141

codi::EventSystem::notifyPreaccFinishListeners
static void notifyPreaccFinishListeners(Tape &tape)
Invoke callbacks for PreaccFinish events.
Definition: eventSystem.hpp:579

codi::EventSystem::notifyPreaccAddOutputListeners
static void notifyPreaccAddOutputListeners(Tape &tape, Real &value, Identifier &identifier)
Invoke callbacks for PreaccAddOutput events.
Definition: eventSystem.hpp:636

codi::EventSystem::notifyPreaccAddInputListeners
static void notifyPreaccAddInputListeners(Tape &tape, Real const &value, Identifier const &identifier)
Invoke callbacks for PreaccAddInput events.
Definition: eventSystem.hpp:607

codi::EventSystem::notifyPreaccStartListeners
static void notifyPreaccStartListeners(Tape &tape)
Invoke callbacks for PreaccStart events.
Definition: eventSystem.hpp:553

codi::JacobianCountNonZerosRow
Adds counting of nonzero entries.
Definition: jacobian.hpp:129

codi::JacobianCountNonZerosRow::nonZerosRow
int & nonZerosRow(size_t const i)
Reference to the number of nonzero entries for the specified row.
Definition: jacobian.hpp:167

codi::JacobianCountNonZerosRow::resize
void resize(size_t const m, size_t const n)
Resize the Jacobian.
Definition: jacobian.hpp:161

codi::Jacobian::getM
size_t getM() const
Get size of rows (output variables).
Definition: jacobian.hpp:78

codi::Jacobian::getN
size_t getN() const
Get size of columns (input variables).
Definition: jacobian.hpp:83

codi::PreaccumulationHelper
Stores the Jacobian matrix for a code section.
Definition: preaccumulationHelper.hpp:76

codi::PreaccumulationHelper::finish
void finish(bool const storeAdjoints, Outputs &... outputs)
Finish the preaccumulation region and perform the preaccumulation. See addOutput() for outputs.
Definition: preaccumulationHelper.hpp:149

codi::PreaccumulationHelper::storedAdjoints
std::vector< Gradient > storedAdjoints
Storage for the adjoints of the inputs if they are to be saved before the preaccumulation.
Definition: preaccumulationHelper.hpp:100

codi::PreaccumulationHelper::startPos
Position startPos
Starting position for the region.
Definition: preaccumulationHelper.hpp:99

codi::PreaccumulationHelper::PreaccumulationHelper
PreaccumulationHelper()
Constructor.
Definition: preaccumulationHelper.hpp:106

codi::PreaccumulationHelper::addInput
void addInput(Inputs const &... inputs)
Add multiple additional inputs. Inputs need to be of type Type. Called after start().
Definition: preaccumulationHelper.hpp:111

codi::PreaccumulationHelper::Tape
typename Type::Tape Tape
See LhsExpressionInterface.
Definition: preaccumulationHelper.hpp:87

codi::PreaccumulationHelper::inputData
std::vector< Identifier > inputData
Definition: preaccumulationHelper.hpp:90

codi::PreaccumulationHelper::Position
typename Tape::Position Position
See PositionalEvaluationTapeInterface.
Definition: preaccumulationHelper.hpp:88

codi::PreaccumulationHelper::Identifier
typename Type::Identifier Identifier
See LhsExpressionInterface.
Definition: preaccumulationHelper.hpp:83

codi::PreaccumulationHelper::Gradient
typename Type::Gradient Gradient
See LhsExpressionInterface.
Definition: preaccumulationHelper.hpp:84

codi::PreaccumulationHelper::outputValues
std::vector< Type * > outputValues
Definition: preaccumulationHelper.hpp:94

codi::PreaccumulationHelper::Type
T_Type Type
See PreaccumulationHelper.
Definition: preaccumulationHelper.hpp:80

codi::PreaccumulationHelper::outputData
std::vector< Identifier > outputData
Definition: preaccumulationHelper.hpp:92

codi::PreaccumulationHelper::Real
typename Type::Real Real
See LhsExpressionInterface.
Definition: preaccumulationHelper.hpp:82

codi::PreaccumulationHelper::start
void start(Inputs const &... inputs)
Starts a preaccumulation region. Resets the internal state. See addInput() for inputs.
Definition: preaccumulationHelper.hpp:121

codi::PreaccumulationHelper::addOutput
void addOutput(Outputs &... outputs)
Add multiple additional outputs. Outputs need to be of type Type. Called before finish().
Definition: preaccumulationHelper.hpp:139

codi::PreaccumulationHelper::jacobian
JacobianCountNonZerosRow< Real > jacobian
Jacobian for the preaccumulation.
Definition: preaccumulationHelper.hpp:101