latest/doxygen/Rnn_8hpp_source.html

// Copyright (c) 2021 Graphcore Ltd. All rights reserved.

#ifndef popnn_Rnn_hpp

#define popnn_Rnn_hpp


#include <cassert>
#include <cstddef>
#include <cstdint>
#include <functional>
#include <vector>

#include <poplar/Graph.hpp>
#include <poplar/Program.hpp>
#include <poplar/Tensor.hpp>
#include <poputil/DebugInfo.hpp>


namespace popnn {

namespace rnn {


/// Structure of Recurrent Neural Network (RNN) parameters.
struct RnnParams {
  /// The datatype used for the RNN.
  poplar::Type dataType;

  /// The batch size.
  std::size_t batchSize;

  /// The maximum number of RNN time steps.
  std::size_t maxTimeSteps;

  /// Number of RNN time steps.
  /// NOTE(review): presumably the fixed step count supplied to the first
  /// constructor; its relationship to `maxTimeSteps` is not visible in this
  /// header - confirm against the implementation.
  std::size_t timeSteps;

  /// The run-time number of RNN time steps, of dimension [batchSize].
  /// NOTE(review): the meaning of a default-constructed tensor here is
  /// defined by the implementation - confirm before relying on it.
  poplar::Tensor varTimeSteps;

  /// For each RNN layer, the layer size parameter needs to be specified for
  /// the input and the output.
  std::vector<std::size_t> layerSizes;

  /// Construct from a data type, batch size, time-step count and layer sizes.
  RnnParams(poplar::Type dataType,
            std::size_t batchSize,
            std::size_t timeSteps,
            std::vector<std::size_t> layerSizes);

  /// Construct from a data type, batch size, maximum time-step count, a
  /// tensor of run-time time steps and layer sizes.
  RnnParams(poplar::Type dataType,
            std::size_t batchSize,
            std::size_t maxTimeSteps,
            const poplar::Tensor &varTimeSteps,
            std::vector<std::size_t> layerSizes);

  /// Return the maximum number of shards.
  std::size_t getMaxShards(const poplar::Graph &graph) const;

  /// Return the number of bytes of the input per tile.
  std::size_t getInputBytesPerTile(const poplar::Graph &graph) const;

  /// Return the number of bytes of the output per tile.
  std::size_t getOutputBytesPerTile(const poplar::Graph &graph) const;

  /// Indicate that time steps are determined by tensor variable.
  bool variableTimeSteps() const;

  /// Indicate that time steps are determined by tensor variable for each
  /// batch.
  bool batchVariableTimeSteps() const;
};


/// Create state tensor to be used in all recurrences of the RNN.
///
/// NOTE(review): the exact meaning of `isOutput`, `multiple` and `numShards`
/// is defined by the implementation, which is not part of this header.
///
/// \return The created state tensor.
poplar::Tensor createInitialState(poplar::Graph &graph,
                                  const RnnParams &params,
                                  bool isOutput,
                                  unsigned multiple,
                                  unsigned numShards,
                                  const poplar::DebugContext &debugContext = {});


/// Create recurrent tensor of shape [timeSteps, batchSize, size] suitable for
/// slicing and/or sharding.
///
/// \return The created recurrent tensor.
poplar::Tensor createRecurrentTensor(poplar::Graph &graph,
                                     const RnnParams &params,
                                     unsigned size,
                                     unsigned numShards,
                                     const poplar::DebugContext &debugContext = {});


/// Create input tensor of shape [timeSteps, batchSize, inputSize] suitable for
/// slicing and/or sharding.
///
/// \return The created input tensor.
poplar::Tensor createInputTensor(poplar::Graph &graph,
                                 const RnnParams &params,
                                 unsigned numShards,
                                 const poplar::DebugContext &debugContext = {});


/// Create a standard output tensor of shape
/// [timeSteps, batchSize, outputSize] suitable for slicing and/or sharding.
///
/// \return The created output tensor.
poplar::Tensor createOutputTensor(poplar::Graph &graph,
                                  const RnnParams &params,
                                  unsigned numShards,
                                  const poplar::DebugContext &debugContext = {});


/// Overload of createOutputTensor that takes an additional `multiple`
/// argument.
///
/// NOTE(review): presumably `multiple` scales how many standard output
/// tensors are packed into the result - confirm against the implementation.
///
/// \return The created output tensor.
poplar::Tensor createOutputTensor(poplar::Graph &graph,
                                  const RnnParams &params,
                                  unsigned multiple,
                                  unsigned numShards,
                                  const poplar::DebugContext &debugContext = {});


/// Create a single-step shifted RNN tensor from an input tensor.
///
/// NOTE(review): the roles of `tBase` and `tSingle`, and the direction of the
/// shift, are defined by the implementation - confirm before relying on them.
/// `prog` is taken by non-const reference, so the call may add programs to it.
///
/// \return The shifted tensor.
poplar::Tensor shiftRnnTensor(poplar::Graph &graph,
                              const RnnParams &params,
                              const poplar::Tensor &tBase,
                              const poplar::Tensor &tSingle,
                              poplar::program::Sequence &prog,
                              unsigned numShards,
                              const poplar::DebugContext &debugContext = {});


/// Tensors required for processing a single time step.
struct RnnSlice {
  std::vector<poplar::Tensor> inputs;  ///< Input tensors for the step.
  poplar::Tensor interimIn;            ///< Interim (intermediate) input.
  poplar::Tensor interimOut;           ///< Interim (intermediate) output.
  std::vector<poplar::Tensor> outputs; ///< Output tensors for the step.
};


/// Flags set per batch if the current step is within the batchwise step limit.
/// The component tensor(s) are of type `dataType` and shape [`batchSize`].
struct RnnBatchwiseFlags {
  /// Per-batch flag tensor.
  poplar::Tensor mask;

  /// NOTE(review): presumably the complement of `mask` - confirm against the
  /// code that populates this structure.
  poplar::Tensor inverse;

  /// Report whether the flags are usable.
  ///
  /// Only `mask` is consulted; `inverse` is not checked.
  ///
  /// \return The result of `mask.valid()`.
  bool valid() const { return mask.valid(); }
};


/// Time-step related tensors handed to the loop body (see `LoopBodyType`).
///
/// NOTE(review): the field descriptions below are inferred from the names
/// only - confirm against the implementation.
struct TimeStepState {
  poplar::Tensor begin;           ///< Presumably the starting step of the loop.
  poplar::Tensor counter;         ///< Presumably the current step counter.
  poplar::Tensor variableSeqFlag; ///< Presumably a variable-sequence-length flag.
};


/// Create loop body function for the given shard.
///
/// The callable returns the `poplar::program::Sequence` for the loop body.
/// NOTE(review): the meaning of the unnamed arguments (the two tensor vectors
/// and the `Sequence` pointer) is not visible in this header - confirm
/// against the callers.
using LoopBodyType = std::function<poplar::program::Sequence(
    poplar::Graph &graph,
    const TimeStepState &time,
    const RnnBatchwiseFlags &,
    std::vector<poplar::Tensor> &,
    const RnnSlice &slice,
    std::vector<poplar::Tensor> &,
    poplar::program::Sequence *,
    const poplar::DebugNameAndId &)>;


/// Create gather body function for the given shard.
///
/// The callable returns the `poplar::program::Sequence` for the gather body.
/// NOTE(review): the meaning of the unnamed `Sequence` pointer argument is
/// not visible in this header - confirm against the callers.
using GatherBodyType = std::function<poplar::program::Sequence(
    poplar::Graph &graph,
    const RnnSlice &slice,
    unsigned stepsPerGather,
    poplar::program::Sequence *,
    const poplar::DebugNameAndId &)>;


/// Structure that associates a particular state tensor with a user-defined
/// output tensor.
struct StateSequence {
  /// The user-defined output tensor.
  poplar::Tensor output;

  /// NOTE(review): presumably the index of the associated state tensor within
  /// the state vector passed to `Rnn` - confirm against the implementation.
  std::size_t stateIndex;
};


/// Run custom Recurrent Neural Net cell implementation recurrently.
///
/// `loopFn` supplies the per-shard loop body (see `LoopBodyType`). `interimIn`
/// and `interimOut` are passed as pointers, and `prog` and `options` are taken
/// by non-const reference.
/// NOTE(review): whether null pointers are accepted for `interimIn` /
/// `interimOut`, and what the returned tensors contain, is defined by the
/// implementation - confirm before relying on it.
///
/// \return A vector of tensors produced by the RNN.
std::vector<poplar::Tensor> Rnn(poplar::Graph &graph,
                                const RnnParams &params,
                                bool reverse,
                                const std::vector<poplar::Tensor> &initState,
                                const StateSequence &stateSequence,
                                const std::vector<poplar::Tensor> &inputs,
                                const poplar::Tensor *interimIn,
                                poplar::Tensor *interimOut,
                                const std::vector<poplar::Tensor> &outputs,
                                const std::vector<poplar::Tensor> &created,
                                poplar::program::Sequence &prog,
                                const LoopBodyType &loopFn,
                                unsigned numShards,
                                poplar::OptionFlags &options,
                                const poplar::DebugContext &debugContext = {});


/// Overload of Rnn that additionally takes gather inputs, a gather body
/// function (see `GatherBodyType`) and a `stepsPerGather` count.
///
/// Unlike the overload with a `reverse` flag, this one takes `interimIn` by
/// const reference and has a `numTemps` argument.
/// NOTE(review): the meaning of `numTemps` and of the returned tensors is
/// defined by the implementation - confirm before relying on it.
///
/// \return A vector of tensors produced by the RNN.
std::vector<poplar::Tensor> Rnn(poplar::Graph &graph,
                                const RnnParams &params,
                                const std::vector<poplar::Tensor> &initState,
                                const StateSequence &stateSequence,
                                const std::vector<poplar::Tensor> &inputs,
                                const poplar::Tensor &interimIn,
                                const unsigned numTemps,
                                poplar::program::Sequence &prog,
                                const LoopBodyType &loopFn,
                                const std::vector<poplar::Tensor> &gatherInputs,
                                const GatherBodyType &gatherFn,
                                unsigned numShards,
                                unsigned stepsPerGather,
                                poplar::OptionFlags &options,
                                const poplar::DebugContext &debugContext = {});


} // namespace rnn

} // namespace popnn


#endif // #ifndef popnn_Rnn_hpp

DebugInfo.hpp
Poplibs generic debug info structure.

poplar::DebugContext
DebugContext gathers the common external parameters of the context of an operation.
Definition: DebugContext.hpp:221

poplar::DebugNameAndId
DebugNameAndId bundles a name and a DebugId to facilitate their propagation through function calls.
Definition: DebugContext.hpp:142

poplar::Graph
This class represents a graph program to be executed on the IPU.
Definition: Graph.hpp:52

poplar::OptionFlags
A set of option/value string flags to be used in various APIs.
Definition: OptionFlags.hpp:24

poplar::Tensor
A reference to a subset of tensor elements.
Definition: Tensor.hpp:38

poplar::Type
Class representing device data types.
Definition: Type.hpp:42

poplar::program::Sequence
Program that executes a sequence of programs.
Definition: Program.hpp:77

popnn::rnn::createRecurrentTensor
poplar::Tensor createRecurrentTensor(poplar::Graph &graph, const RnnParams &params, unsigned size, unsigned numShards, const poplar::DebugContext &debugContext={})
Create recurrent tensor of shape [timeSteps, batchSize, size] suitable for slicing and/or sharding of...

popnn::rnn::createOutputTensor
poplar::Tensor createOutputTensor(poplar::Graph &graph, const RnnParams &params, unsigned numShards, const poplar::DebugContext &debugContext={})
Create a standard output tensor of shape [timeSteps, batchSize, outputSize] suitable for slicing and/...

popnn::rnn::shiftRnnTensor
poplar::Tensor shiftRnnTensor(poplar::Graph &graph, const RnnParams &params, const poplar::Tensor &tBase, const poplar::Tensor &tSingle, poplar::program::Sequence &prog, unsigned numShards, const poplar::DebugContext &debugContext={})
Create a single-step shifted RNN tensor from an input tensor.

popnn::rnn::createInputTensor
poplar::Tensor createInputTensor(poplar::Graph &graph, const RnnParams &params, unsigned numShards, const poplar::DebugContext &debugContext={})
Create input tensor of shape [timeSteps, batchSize, inputSize] suitable for slicing and/or sharding o...

popnn::rnn::Rnn
std::vector< poplar::Tensor > Rnn(poplar::Graph &graph, const RnnParams &params, bool reverse, const std::vector< poplar::Tensor > &initState, const StateSequence &stateSequence, const std::vector< poplar::Tensor > &inputs, const poplar::Tensor *interimIn, poplar::Tensor *interimOut, const std::vector< poplar::Tensor > &outputs, const std::vector< poplar::Tensor > &created, poplar::program::Sequence &prog, const LoopBodyType &loopFn, unsigned numShards, poplar::OptionFlags &options, const poplar::DebugContext &debugContext={})
Run custom Recurrent Neural Net cell implementation recurrently.

popnn::rnn::createInitialState
poplar::Tensor createInitialState(poplar::Graph &graph, const RnnParams &params, bool isOutput, unsigned multiple, unsigned numShards, const poplar::DebugContext &debugContext={})
Create state tensor to be used in all recurrences of the RNN.

popnn::rnn::LoopBodyType
std::function< poplar::program::Sequence(poplar::Graph &graph, const TimeStepState &time, const RnnBatchwiseFlags &, std::vector< poplar::Tensor > &, const RnnSlice &slice, std::vector< poplar::Tensor > &, poplar::program::Sequence *, const poplar::DebugNameAndId &)> LoopBodyType
Create loop body function for the given shard.
Definition: Rnn.hpp:238

popnn::rnn::GatherBodyType
std::function< poplar::program::Sequence(poplar::Graph &graph, const RnnSlice &slice, unsigned stepsPerGather, poplar::program::Sequence *, const poplar::DebugNameAndId &)> GatherBodyType
Create gather body function for the given shard.
Definition: Rnn.hpp:253

popnn
Functions used in neural networks.
Definition: BatchNorm.hpp:14

popnn::rnn::RnnParams
Structure of Recurrent Neural Network (RNN) parameters which allows for any customized implementation...
Definition: Rnn.hpp:22

popnn::rnn::RnnParams::maxTimeSteps
std::size_t maxTimeSteps
The maximum number of RNN time steps.
Definition: Rnn.hpp:30

popnn::rnn::RnnParams::layerSizes
std::vector< std::size_t > layerSizes
For each RNN layer, the layer size parameter needs to be specified for the input and the output.
Definition: Rnn.hpp:45

popnn::rnn::RnnParams::dataType
poplar::Type dataType
The datatype used for the RNN.
Definition: Rnn.hpp:24

popnn::rnn::RnnParams::timeSteps
std::size_t timeSteps
Definition: Rnn.hpp:33

popnn::rnn::RnnParams::varTimeSteps
poplar::Tensor varTimeSteps
The run-time number of RNN time steps, of dimension [batchSize]. If this tensor is default constructed,...
Definition: Rnn.hpp:39

popnn::rnn::RnnParams::batchSize
std::size_t batchSize
The batch size.
Definition: Rnn.hpp:27

popnn::rnn::RnnSlice
Tensors required for processing a single time step.
Definition: Rnn.hpp:192

popnn::rnn::StateSequence
Structure that associates a particular state tensor with a user-defined output tensor.
Definition: Rnn.hpp:264