latest/doxygen/Util_8hpp_source.html

// Copyright (c) 2016 Graphcore Ltd. All rights reserved.

#ifndef poputil_Util_hpp

#define poputil_Util_hpp


#include <algorithm>

#include <cassert>

#include <climits>

#include <poplar/Device.hpp>

#include <poplar/Graph.hpp>

#include <poplar/Interval.hpp>

#include <poplar/Program.hpp>

#include <poplar/Quarter.hpp>

#include <poplar/Target.hpp>

#include <poplar/Tensor.hpp>

#include <string>

#include <vector>


namespace poputil {


/// Merge adjacent regions within a single list of intervals.
///
/// \param regions  The intervals to process. Taken by non-const reference and
///                 the function returns void, so the result is presumably
///                 written back into this vector.
///
/// NOTE(review): what counts as "adjacent", and whether the input has to be
/// sorted, is decided by the implementation, which is not visible in this
/// header - confirm before relying on it.
void mergeAdjacentRegions(std::vector<poplar::Interval> &regions);


/// Merge adjacent regions for a list of interval lists.
///
/// \param mapping  A vector of interval vectors. Taken by non-const reference
///                 and the function returns void, so the result is presumably
///                 written back into this argument.
///
/// NOTE(review): presumably each inner vector is merged independently (for
/// example one inner vector per tile) - confirm against the implementation.
void mergeAdjacentRegions(std::vector<std::vector<poplar::Interval>> &mapping);


/// Flatten a vector of vectors of intervals to a vector, maintaining
/// ordering.
///
/// \param intervals  The nested interval lists to flatten.
/// \return A single vector holding the intervals of every inner vector.
std::vector<poplar::Interval>

flattenIntervals(const std::vector<std::vector<poplar::Interval>> &intervals);


/// Given a set of contiguous regions, partition these regions while trying
/// to balance the number of elements across the partitions.
///
/// \param regions                  The contiguous regions to partition.
/// \param grainSize                Granularity of the split. NOTE(review):
///                                 presumably partition sizes are kept to a
///                                 multiple of this - confirm.
/// \param maxPartitions            Upper bound on the number of partitions.
/// \param minElementsPerPartition  Defaults to 0. Presumably a lower bound on
///                                 the elements placed in one partition.
/// \param maxElementsPerPartition  Defaults to UINT_MAX. Presumably an upper
///                                 bound on the elements in one partition.
/// \param maxElementsPerRegion     Defaults to UINT_MAX. Presumably an upper
///                                 bound on the size of any single region in
///                                 the output.
/// \return A vector of interval vectors; presumably one inner vector per
///         partition.
std::vector<std::vector<poplar::Interval>>

splitRegions(const std::vector<poplar::Interval> &regions, unsigned grainSize,

             unsigned maxPartitions, unsigned minElementsPerPartition = 0,

             unsigned maxElementsPerPartition = UINT_MAX,

             unsigned maxElementsPerRegion = UINT_MAX);


/// Given a set of contiguous regions per tile, partition these regions
/// between workers on that tile.
///
/// \param target                   The target. NOTE(review): presumably used
///                                 to find the number of workers per tile -
///                                 confirm.
/// \param regions                  The contiguous regions to partition.
/// \param grainSize                Granularity of the split. NOTE(review):
///                                 presumably partition sizes are kept to a
///                                 multiple of this - confirm.
/// \param minElementsPerPartition  Defaults to 0. Presumably a lower bound on
///                                 the elements given to one worker.
/// \param maxElementsPerPartition  Defaults to UINT_MAX. Presumably an upper
///                                 bound on the elements given to one worker.
/// \param maxElementsPerRegion     Defaults to UINT_MAX. Presumably an upper
///                                 bound on the size of any single region in
///                                 the output.
/// \return A vector of interval vectors; presumably one inner vector per
///         worker.
std::vector<std::vector<poplar::Interval>> splitRegionsBetweenWorkers(

    const poplar::Target &target, const std::vector<poplar::Interval> &regions,

    unsigned grainSize, unsigned minElementsPerPartition = 0,

    unsigned maxElementsPerPartition = UINT_MAX,

    unsigned maxElementsPerRegion = UINT_MAX);


/// Overload of splitRegions() that takes a vector of region lists rather than
/// a single flat list of regions.
///
/// NOTE(review): presumably the inner vectors of \p regions are kept together
/// as units while partitioning - confirm against the implementation.
///
/// \param regions                  The groups of regions to partition.
/// \param grainSize                Granularity of the split (semantics to be
///                                 confirmed against the implementation).
/// \param maxPartitions            Upper bound on the number of partitions.
/// \param minElementsPerPartition  Defaults to 0.
/// \param maxElementsPerPartition  Defaults to UINT_MAX.
/// \param maxElementsPerRegion     Defaults to UINT_MAX.
/// \return A three-level nesting of intervals; presumably the outermost index
///         selects the partition.
std::vector<std::vector<std::vector<poplar::Interval>>>

splitRegions(const std::vector<std::vector<poplar::Interval>> &regions,

             unsigned grainSize, unsigned maxPartitions,

             unsigned minElementsPerPartition = 0,

             unsigned maxElementsPerPartition = UINT_MAX,

             unsigned maxElementsPerRegion = UINT_MAX);


/// Overload of splitRegionsBetweenWorkers() that takes a vector of region
/// lists rather than a single flat list of regions.
///
/// NOTE(review): presumably the inner vectors of \p regions are kept together
/// as units while partitioning - confirm against the implementation.
///
/// \param target                   The target. Presumably used to find the
///                                 number of workers per tile - confirm.
/// \param regions                  The groups of regions to partition.
/// \param grainSize                Granularity of the split (semantics to be
///                                 confirmed against the implementation).
/// \param minElementsPerPartition  Defaults to 0.
/// \param maxElementsPerPartition  Defaults to UINT_MAX.
/// \param maxElementsPerRegion     Defaults to UINT_MAX.
/// \return A three-level nesting of intervals; presumably the outermost index
///         selects the worker.
std::vector<std::vector<std::vector<poplar::Interval>>>

splitRegionsBetweenWorkers(

    const poplar::Target &target,

    const std::vector<std::vector<poplar::Interval>> &regions,

    unsigned grainSize, unsigned minElementsPerPartition = 0,

    unsigned maxElementsPerPartition = UINT_MAX,

    unsigned maxElementsPerRegion = UINT_MAX);


/// Convert an index into a flattened tensor back into per-dimension indices.
///
/// The last dimension of \p shape varies fastest: the flat index is peeled
/// apart from the innermost dimension outwards.
///
/// \param shape  The extent of each dimension of the original tensor.
/// \param index  The position in the flattened tensor.
/// \return One coordinate per dimension, in the same order as \p shape.
///
/// In builds with assertions enabled, an \p index that does not fit within
/// \p shape trips an assert.
template <class T>
std::vector<T> unflattenIndex(const std::vector<T> &shape, std::size_t index) {
  const std::size_t rank = shape.size();
  std::vector<T> coord(rank);

  // Walk the dimensions from innermost to outermost, taking the remainder as
  // this dimension's coordinate and carrying the quotient outwards.
  std::size_t remaining = index;
  std::size_t dim = rank;
  while (dim-- > 0) {
    const auto extent = shape[dim];
    coord[dim] = remaining % extent;
    remaining /= extent;
  }

  // Anything left over means the index was beyond the end of the shape.
  assert(remaining == 0);
  return coord;
}


/// Convert per-dimension indices into an index into the flattened tensor.
///
/// The last dimension of \p shape varies fastest, so this is the inverse of
/// peeling a flat index apart from the innermost dimension outwards.
///
/// \param shape    The extent of each dimension of the tensor.
/// \param indices  One index per dimension, in the same order as \p shape.
/// \return The position of the element in the flattened tensor.
///
/// In builds with assertions enabled, an \p indices vector whose size differs
/// from that of \p shape trips an assert.
template <class T>
std::size_t flattenIndex(const std::vector<T> &shape,
                         const std::vector<T> &indices) {
  const auto numDims = shape.size();
  assert(indices.size() == numDims);

  // Horner-style accumulation from the outermost dimension inwards.
  std::size_t flat = 0;
  unsigned dim = 0;
  while (dim != numDims) {
    flat = flat * shape[dim] + indices[dim];
    ++dim;
  }
  return flat;
}


/// Return the total number of elements in the interval sequence.
///
/// \param seq  The sequence of interval lists to measure.
/// \return The total element count over every interval in \p seq.
std::size_t intervalSequenceNumElements(

    const std::vector<std::vector<poplar::Interval>> &seq);


/// Copy a tensor's data to a new tensor.
///
/// \param graph         The graph being built.
/// \param in            The tensor whose data is copied.
/// \param p             A program sequence. NOTE(review): presumably the copy
///                      program is appended to it - confirm.
/// \param debugContext  Optional debug information; defaults to an empty
///                      context.
/// \param method        Behaviour when the tensor is cloned; defaults to
///                      PRESERVE_ORDER_UNLESS_ALIASES.
/// \return The new tensor.
poplar::Tensor

duplicate(poplar::Graph &graph, const poplar::Tensor &in,

          poplar::program::Sequence &p,

          const poplar::DebugContext &debugContext = {},

          poplar::TensorCloneMethod method =

              poplar::TensorCloneMethod::PRESERVE_ORDER_UNLESS_ALIASES);


/// Clone a tensor N times.
///
/// \param graph         The graph being built.
/// \param t             The tensor to clone.
/// \param N             The number of clones to create.
/// \param debugContext  Optional debug information; defaults to an empty
///                      context.
/// \param method        Behaviour when the tensor is cloned; defaults to
///                      PRESERVE_ORDER_UNLESS_ALIASES.
/// \return A tensor holding the clones. NOTE(review): presumably the clones
///         are stacked along a new outermost dimension of size \p N -
///         confirm against the implementation.
poplar::Tensor

cloneN(poplar::Graph &graph, const poplar::Tensor &t, unsigned N,

       const poplar::DebugContext &debugContext = {},

       poplar::TensorCloneMethod method =

           poplar::TensorCloneMethod::PRESERVE_ORDER_UNLESS_ALIASES);


/// Split a range.
///
/// \param rangeUpperBound  The upper bound of the range to split.
///                         NOTE(review): presumably the range starts at zero
///                         and the bound is inclusive or exclusive as defined
///                         by the implementation - confirm.
/// \param splitCount       The number of pieces to split the range into.
/// \return The sizes (or boundaries) of the pieces. NOTE(review): the exact
///         meaning of the returned values is not visible in this header;
///         going by the name, the pieces are presumably as equal in size as
///         possible.
std::vector<int> balancedPartition(int rangeUpperBound, int splitCount);


/// Cast a double precision value to a value exactly representable in device
/// HALF type.
///
/// \param target  The target whose HALF representation is used.
/// \param input   The double precision value to convert.
/// \return A double holding a value that the device HALF type can represent
///         exactly.
double castToDeviceHalfValue(const poplar::Target &target, double input);


/// Check accuracy of a cast operation.
///
/// \param target      The target on which the cast would be performed.
/// \param input       The value to be cast.
/// \param inputType   The device type the value is cast from.
/// \param outputType  The device type the value is cast to.
/// \param tolerance   The allowed error. NOTE(review): whether this is an
///                    absolute or a relative tolerance is not visible in this
///                    header - confirm.
/// \return Presumably true when the cast result is within \p tolerance of
///         \p input - confirm against the implementation.
bool checkAccuracyWhenCast(const poplar::Target &target, double input,

                           poplar::Type inputType, poplar::Type outputType,

                           double tolerance);


/// Factors the outermost dimensions of tensor \p t by the values given in
/// \p factors.
///
/// \param t         The tensor to factor.
/// \param factors   The values to factor the dimensions by.
/// \param startDim  Defaults to 0. NOTE(review): presumably the first
///                  dimension to which the factoring is applied - confirm.
/// \return The tensor with the factored dimensions. NOTE(review): the layout
///         of the resulting dimensions is defined by the implementation, not
///         visible here.
poplar::Tensor factorDims(const poplar::Tensor &t,

                          const std::vector<std::size_t> &factors,

                          unsigned startDim = 0);


/// The opposite of factorDims().
///
/// \param t         The tensor whose dimensions were previously factored.
/// \param numDims   The number of dimensions that were factored.
///                  NOTE(review): inferred from the parameter name - confirm.
/// \param startDim  Defaults to 0. Presumably the same starting dimension
///                  that was given to factorDims().
/// \return The tensor with the factoring undone.
poplar::Tensor unfactorDims(const poplar::Tensor &t, unsigned numDims,

                            unsigned startDim = 0);


// Create metadata for use with FP8 data types
//
// graph      The graph to which the metadata tensor is added.
// fp8Format  The FP8 format to record in the metadata.
// fp8Scale   The scale to record in the metadata.
//
// Returns the metadata tensor.
// NOTE(review): going by the name, this presumably creates a constant
// tensor - confirm against the implementation.

poplar::Tensor

createConstantMetadataTensor(poplar::Graph &graph,

                             poplar::QuarterMetadata::Format fp8Format,

                             int fp8Scale);


// Create a metadata tensor for use with FP8 data types.
//
// graph      The graph to which the metadata tensor is added.
// fp8Format  The FP8 format to record in the metadata.
// fp8Scale   The scale to record in the metadata.
//
// Returns the metadata tensor.
// NOTE(review): going by the name, this presumably creates a graph variable
// rather than a constant; how and when it is initialised with the given
// format and scale is not visible in this header - confirm.
poplar::Tensor

createVariableMetadataTensor(poplar::Graph &graph,

                             poplar::QuarterMetadata::Format fp8Format,

                             int fp8Scale);


/// Calculate the un-shuffling intervals based on the given intervals.
///
/// \param intervals  The intervals describing the shuffled arrangement.
/// \return The intervals that undo the shuffle. NOTE(review): presumably,
///         applying the returned intervals to data gathered with
///         \p intervals restores the original element order - confirm
///         against the implementation.
std::vector<poplar::Interval>

calculateUnshufflingIntervals(const std::vector<poplar::Interval> &intervals);


} // end namespace poputil


#endif // poputil_Util_hpp

poplar::DebugContext
DebugContext gathers the common external parameters of the context of an operation.
Definition: DebugContext.hpp:221

poplar::Graph
This class represents a graph program to be executed on the IPU.
Definition: Graph.hpp:52

poplar::Target
A target representation.
Definition: Target.hpp:69

poplar::Tensor
A reference to a subset of tensor elements.
Definition: Tensor.hpp:38

poplar::Type
Class representing device data types.
Definition: Type.hpp:42

poplar::program::Sequence
Program that executes a sequence of programs.
Definition: Program.hpp:77

poplar::TensorCloneMethod
TensorCloneMethod
Define behaviour when a Tensor is cloned.
Definition: TensorCloneMethod.hpp:13

poplar::TensorCloneMethod::PRESERVE_ORDER_UNLESS_ALIASES
@ PRESERVE_ORDER_UNLESS_ALIASES
Preserve the ordering of the original tensor unless it contains aliases.

poputil
General utility functions for building graphs.
Definition: GfloatExprUtil.hpp:23

poputil::intervalSequenceNumElements
std::size_t intervalSequenceNumElements(const std::vector< std::vector< poplar::Interval > > &seq)
Return the total number of elements in the interval sequence.

poputil::calculateUnshufflingIntervals
std::vector< poplar::Interval > calculateUnshufflingIntervals(const std::vector< poplar::Interval > &intervals)
Calculate the un-shuffling intervals based on the given intervals.

poputil::factorDims
poplar::Tensor factorDims(const poplar::Tensor &t, const std::vector< std::size_t > &factors, unsigned startDim=0)
Factors the outermost dimensions of tensor t by the values given in factors.

poputil::cloneN
poplar::Tensor cloneN(poplar::Graph &graph, const poplar::Tensor &t, unsigned N, const poplar::DebugContext &debugContext={}, poplar::TensorCloneMethod method=poplar::TensorCloneMethod::PRESERVE_ORDER_UNLESS_ALIASES)
Clone a tensor N times.

poputil::balancedPartition
std::vector< int > balancedPartition(int rangeUpperBound, int splitCount)
Split a range.

poputil::checkAccuracyWhenCast
bool checkAccuracyWhenCast(const poplar::Target &target, double input, poplar::Type inputType, poplar::Type outputType, double tolerance)
Check accuracy of a cast operation.

poputil::duplicate
poplar::Tensor duplicate(poplar::Graph &graph, const poplar::Tensor &in, poplar::program::Sequence &p, const poplar::DebugContext &debugContext={}, poplar::TensorCloneMethod method=poplar::TensorCloneMethod::PRESERVE_ORDER_UNLESS_ALIASES)
Copy a tensor's data to a new tensor.

poputil::flattenIntervals
std::vector< poplar::Interval > flattenIntervals(const std::vector< std::vector< poplar::Interval > > &intervals)
Flatten a vector of vectors of intervals to a vector, maintaining ordering.

poputil::splitRegionsBetweenWorkers
std::vector< std::vector< poplar::Interval > > splitRegionsBetweenWorkers(const poplar::Target &target, const std::vector< poplar::Interval > &regions, unsigned grainSize, unsigned minElementsPerPartition=0, unsigned maxElementsPerPartition=UINT_MAX, unsigned maxElementsPerRegion=UINT_MAX)
Given a set of contiguous regions per tile, partition these regions between workers on that tile while respecting the specified grain size.

poputil::flattenIndex
std::size_t flattenIndex(const std::vector< T > &shape, const std::vector< T > &indices)
Given a list of indices into a tensor, return the corresponding index in a flattened version of the tensor.
Definition: Util.hpp:96

poputil::unflattenIndex
std::vector< T > unflattenIndex(const std::vector< T > &shape, std::size_t index)
Given an index into a flattened tensor, returns the indices into the dimensions of the original tensor.
Definition: Util.hpp:81

poputil::unfactorDims
poplar::Tensor unfactorDims(const poplar::Tensor &t, unsigned numDims, unsigned startDim=0)
The opposite of factorDims().

poputil::splitRegions
std::vector< std::vector< poplar::Interval > > splitRegions(const std::vector< poplar::Interval > &regions, unsigned grainSize, unsigned maxPartitions, unsigned minElementsPerPartition=0, unsigned maxElementsPerPartition=UINT_MAX, unsigned maxElementsPerRegion=UINT_MAX)
Given a set of contiguous regions, partition these regions while trying to balance the number of elements in each partition and respecting the specified grain size.

poputil::castToDeviceHalfValue
double castToDeviceHalfValue(const poplar::Target &target, double input)
Cast a double precision value to a value exactly representable in device HALF type.