Turi Create  4.0
model_spec.hpp
/* Copyright © 2018 Apple Inc. All rights reserved.
 *
 * Use of this source code is governed by a BSD-3-clause license that can
 * be found in the LICENSE.txt file or at https://opensource.org/licenses/BSD-3-Clause
 */

#ifndef UNITY_TOOLKITS_NEURAL_NET_MODEL_SPEC_HPP_
#define UNITY_TOOLKITS_NEURAL_NET_MODEL_SPEC_HPP_

#include <array>
#include <functional>
#include <memory>
#include <string>
#include <vector>

#include <ml/neural_net/float_array.hpp>
#include <ml/neural_net/weight_init.hpp>

// Forward declare CoreML::Specification::NeuralNetwork in lieu of including
// problematic protocol buffer headers.
namespace CoreML {
namespace Specification {
class NeuralNetwork;
class Pipeline;
class WeightParams;
}
}

namespace turi {
namespace neural_net {

/**
 * Representation for a neural-network model (structure and parameters),
 * optimized for convenient export to CoreML.
 *
 * This class just wraps CoreML::Specification::NeuralNetwork, helping to
 * insulate toolkits from protobuf code.
 */
class model_spec {
public:

  /** Parameter for convolution and pooling layers. */
  enum class padding_type {
    VALID,
    SAME,
  };

  /** Parameter for the padding layer. */
  enum class padding_policy {
    REFLECTIVE,
    REPLICATION,
    ZERO,
  };

  /** Parameter for pooling types. */
  enum class pooling_type { MAX, AVERAGE, L2 };

  /**
   * Creates an empty model_spec (with no layers).
   */
  model_spec();

  /**
   * Initializes a model_spec from a NeuralNetwork proto.
   */
  model_spec(const CoreML::Specification::NeuralNetwork& nn_model);

  /**
   * Initializes a model_spec from the top-level NeuralNetwork found inside a
   * CoreML model specification on disk.
   *
   * \param mlmodel_path Path to a CoreML::Specification::Model proto on disk.
   * \throw If the indicated path could not be read or parsed.
   */
  model_spec(const std::string& mlmodel_path);
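
  // Example (illustrative sketch; the .mlmodel path is hypothetical):
  //
  //   model_spec spec;                              // empty network, no layers
  //   model_spec loaded("/tmp/my_model.mlmodel");   // throws if unreadable
  //
  // Later examples in this header reuse `spec` for brevity.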

  // Declared here and defined in the .cpp file just to prevent the implicit
  // default destructor from attempting (and failing) to instantiate
  // std::unique_ptr<NeuralNetwork>::~unique_ptr()
  model_spec(model_spec&&);
  model_spec& operator=(model_spec&&);
  ~model_spec();

  /**
   * Exposes the underlying CoreML proto.
   */
  const CoreML::Specification::NeuralNetwork& get_coreml_spec() const {
    return *impl_;
  }

  /**
   * Transfers ownership of the underlying CoreML proto, invalidating the
   * current instance (leaving it in a "moved-from" state).
   *
   * (Note that this method may only be invoked on a model_spec&&.)
   */
  std::unique_ptr<CoreML::Specification::NeuralNetwork> move_coreml_spec() &&;
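
  // Example (illustrative sketch; `spec` is a model_spec built elsewhere): the
  // rvalue-reference qualifier means the proto can only be taken from an
  // expiring value:
  //
  //   std::unique_ptr<CoreML::Specification::NeuralNetwork> proto =
  //       std::move(spec).move_coreml_spec();
  //   // `spec` is now moved-from and should not be used further.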

  /**
   * Creates a shared_float_array view (weak reference) into the parameters of
   * the model, indexed by layer name.
   *
   * \return A dictionary whose keys are of the form
   *         "$layername_$paramname". The layer names are taken from the name
   *         field of each NeuralNetworkLayer containing a supported layer. The
   *         supported layers are ConvolutionLayerParams (with params "weight"
   *         (in NCHW order) and "bias") and BatchnormLayerParams (with params
   *         "gamma", "beta", "running_mean", and "running_var").
   * \throw If a NeuralNetworkLayer in the specification seems malformed
   *        (e.g. WeightParams with size inconsistent with declared layer
   *        shape).
   *
   * To avoid copying data, the data backing the shared_float_array instances in
   * the return value will only remain valid for the lifetime of this instance!
   */
  float_array_map export_params_view() const;
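
  // Example (illustrative sketch; the layer name "conv1" is hypothetical, and
  // the shared_float_array accessors are assumed from float_array.hpp):
  //
  //   float_array_map params = spec.export_params_view();
  //   const shared_float_array& conv1_weight = params.at("conv1_weight");
  //   size_t n = conv1_weight.size();  // element count, NCHW order
  //
  // The views are weak references: keep `spec` alive while using them.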

  /**
   * Overwrites existing WeightParams values using the provided float_array
   * values.
   *
   * \param weights A dictionary whose keys follow the same naming scheme used
   *        by `export_params_view`.
   * \param use_quantization If true, weights are stored in half precision.
   * \throw If a float_array's shape does not match the corresponding
   *        NeuralNetworkLayer.
   */
  void update_params(const float_array_map& weights, bool use_quantization = false);
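
  // Example (illustrative sketch; assumes `trained_weights` is a
  // float_array_map keyed like the output of export_params_view()):
  //
  //   spec.update_params(trained_weights);
  //   spec.update_params(trained_weights, /*use_quantization=*/true);  // fp16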

  /**
   * Determines whether the neural network contains a layer with the given
   * output name.
   *
   * In general, it is only safe to add a new layer that takes a named input if
   * this method returns true for that name.
   */
  bool has_layer_output(const std::string& layer_name) const;

  /**
   * Appends a ReLU activation layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   */
  void add_relu(const std::string& name, const std::string& input);

  /**
   * Appends a leaky ReLU activation layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param alpha Scale factor applied to negative inputs
   */
  void add_leakyrelu(const std::string& name, const std::string& input,
                     float alpha);

  /**
   * Appends a sigmoid activation layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   */
  void add_sigmoid(const std::string& name, const std::string& input);

  /**
   * Appends a pooling layer. By default, it performs max pooling.
   *
   * The pooling type can be:
   * - MAX
   * - AVERAGE
   * - L2
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param pooling The type of pooling this layer performs.
   * \param use_poolexcludepadding If true, padded values are excluded from the
   *        count (denominator) when computing average pooling.
   */
  void add_pooling(const std::string& name, const std::string& input, size_t kernel_height,
                   size_t kernel_width, size_t stride_h, size_t stride_w, padding_type padding,
                   bool use_poolexcludepadding = false, pooling_type pooling = pooling_type::MAX);
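
  // Example (illustrative sketch; layer and input names are hypothetical):
  //
  //   // 2x2 average pooling with stride 2 and VALID padding.
  //   spec.add_pooling("pool1", "conv1", /*kernel_height=*/2, /*kernel_width=*/2,
  //                    /*stride_h=*/2, /*stride_w=*/2, model_spec::padding_type::VALID,
  //                    /*use_poolexcludepadding=*/false,
  //                    model_spec::pooling_type::AVERAGE);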

  /**
   * Appends a convolution layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param num_output_channels The number of distinct filters in this layer
   * \param num_kernel_channels The number of input features per "pixel"
   * \param kernel_height The height of the kernel
   * \param kernel_width The width of the kernel
   * \param weight_initializer_fn Callback used to initialize the conv weights
   * \param bias_initializer_fn Callback used to initialize the conv bias. If
   *        nullptr, then no bias vector is set.
   */
  void add_convolution(const std::string& name, const std::string& input,
                       size_t num_output_channels, size_t num_kernel_channels,
                       size_t kernel_height, size_t kernel_width,
                       size_t stride_h, size_t stride_w, padding_type padding,
                       weight_initializer weight_initializer_fn,
                       weight_initializer bias_initializer_fn = nullptr);
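
  // Example (illustrative sketch; assumes `conv_init` is an initializer
  // callable obtained from weight_init.hpp, and the names are hypothetical):
  //
  //   weight_initializer conv_init = /* e.g. an initializer from weight_init.hpp */;
  //   spec.add_convolution("conv1", "image", /*num_output_channels=*/16,
  //                        /*num_kernel_channels=*/3, /*kernel_height=*/3,
  //                        /*kernel_width=*/3, /*stride_h=*/1, /*stride_w=*/1,
  //                        model_spec::padding_type::SAME, conv_init);
  //   // No bias_initializer_fn was passed, so the layer has no bias vector.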

  /**
   * Appends a padding layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param padding_top The padding on the top
   * \param padding_bottom The padding on the bottom
   * \param padding_left The padding to the left
   * \param padding_right The padding to the right
   * \param policy The padding policy: zero, reflective, or replication
   */
  void add_padding(const std::string& name, const std::string& input,
                   size_t padding_top, size_t padding_bottom,
                   size_t padding_left, size_t padding_right,
                   padding_policy policy = padding_policy::REFLECTIVE);

  /**
   * Appends an upsampling layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param scaling_x The upsample scale on the x axis
   * \param scaling_y The upsample scale on the y axis
   */
  void add_upsampling(const std::string& name, const std::string& input,
                      size_t scaling_x, size_t scaling_y);

  /**
   * Appends an inner-product (dense, fully connected) layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param num_output_channels Size of the output vector
   * \param num_input_channels Size of the input vector
   * \param weight_initializer_fn Callback used to initialize the weights
   * \param bias_initializer_fn Callback used to initialize the bias. If
   *        nullptr, then no bias vector is set.
   */
  void add_inner_product(const std::string& name, const std::string& input,
                         size_t num_output_channels, size_t num_input_channels,
                         weight_initializer weight_initializer_fn,
                         weight_initializer bias_initializer_fn = nullptr);
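
  // Example (illustrative sketch; the names and the initializer callables
  // `fc_weight_init`/`fc_bias_init` are hypothetical):
  //
  //   spec.add_inner_product("fc1", "flatten1", /*num_output_channels=*/10,
  //                          /*num_input_channels=*/64, fc_weight_init, fc_bias_init);
  //   spec.add_softmax("probabilities", "fc1");  // typical classifier head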

  /**
   * Appends a batch norm layer.
   *
   * The beta and mean parameters are initialized to 0.f; the gamma and variance
   * parameters are initialized to 1.f.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param num_channels The C dimension of the input and output
   * \param epsilon Added to the variance for each input before normalizing
   */
  void add_batchnorm(const std::string& name, const std::string& input,
                     size_t num_channels, float epsilon);
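
  // Example (illustrative sketch): a common conv -> batchnorm -> relu block,
  // with hypothetical layer names:
  //
  //   spec.add_batchnorm("conv1_bn", "conv1", /*num_channels=*/16, /*epsilon=*/1e-5f);
  //   spec.add_relu("conv1_relu", "conv1_bn");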

  /**
   * Appends an instance norm layer.
   *
   * The beta is initialized to 0.f; the gamma is initialized to 1.f.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param num_channels The C dimension of the input and output
   * \param epsilon Added to the variance for each input before normalizing
   */
  void add_instancenorm(const std::string& name, const std::string& input,
                        size_t num_channels, float epsilon);

  /**
   * Appends a layer that concatenates its inputs along the channel axis.
   *
   * \param name The name of the layer and its output
   * \param inputs The names of the layer's inputs
   */
  void add_channel_concat(const std::string& name,
                          const std::vector<std::string>& inputs);

  /**
   * Appends a layer that performs softmax normalization (along channel axis).
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   */
  void add_softmax(const std::string& name, const std::string& input);

  /**
   * Appends a layer that flattens its input (along the channel axis).
   *
   * Currently only channel-first flattening is supported: if the input shape is
   * ``[C, H, W]``, then the output shape will be ``[C * H * W, 1, 1]``, still in
   * `C-major` order. The underlying array storage is not changed.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   */
  void add_flatten(const std::string& name, const std::string& input);
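
  // Example (illustrative sketch): flattening a hypothetical [16, 4, 4] input
  // produces an output of shape [16 * 4 * 4, 1, 1] = [256, 1, 1]:
  //
  //   spec.add_flatten("flatten1", "pool1");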

  /**
   * Appends a layer that performs elementwise addition.
   *
   * \param name The name of the layer and its output
   * \param inputs The names of the layer's inputs
   */
  void add_addition(const std::string& name,
                    const std::vector<std::string>& inputs);

  /**
   * Appends a layer that performs elementwise multiplication.
   *
   * \param name The name of the layer and its output
   * \param inputs The names of the layer's inputs
   */
  void add_multiplication(const std::string& name,
                          const std::vector<std::string>& inputs);

  /**
   * Appends a layer that applies the unary function f(x) = e^x to its input.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   */
  void add_exp(const std::string& name, const std::string& input);

  /**
   * Appends a layer that performs elementwise multiplication between its input
   * and some fixed weights.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param shape_c_h_w The shape of the input and output
   * \param scale_initializer_fn Callback used to initialize the weights
   */
  void add_scale(const std::string& name, const std::string& input,
                 const std::vector<size_t>& shape_c_h_w,
                 weight_initializer scale_initializer_fn);

  /**
   * Appends a layer with fixed values.
   *
   * \param name The name of the layer and its output
   * \param shape_c_h_w The shape of the output
   * \param weight_initializer_fn Callback used to initialize the weights
   */
  void add_constant(const std::string& name,
                    const std::array<size_t, 3>& shape_c_h_w,
                    weight_initializer weight_initializer_fn);

  /**
   * Appends a layer that reshapes its input.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param seq_c_h_w The shape of the output, as [Seq, C, H, W]
   */
  void add_reshape(const std::string& name, const std::string& input,
                   const std::array<size_t, 4>& seq_c_h_w);

  /**
   * Appends a layer that transposes the dimensions of its input.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param axis_permutation A permutation of [0, 1, 2, 3], describing how to
   *        rearrange the [Seq, C, H, W] input.
   */
  void add_permute(const std::string& name, const std::string& input,
                   const std::array<size_t, 4>& axis_permutation);
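
  // Example (illustrative sketch; layer names are hypothetical): reshape a
  // [1, 256, 1, 1] tensor to [1, 16, 4, 4], then swap the H and W axes
  // (permutation {0, 1, 3, 2} exchanges indices 2 and 3 of [Seq, C, H, W]):
  //
  //   spec.add_reshape("reshaped", "fc1", {{1, 16, 4, 4}});
  //   spec.add_permute("transposed", "reshaped", {{0, 1, 3, 2}});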

  /**
   * Appends a layer that slices the input along the channel axis.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param start_index The first channel to include
   * \param end_index The first channel to stop including. If negative, then the
   *        number of channels is added first (so -1 becomes n - 1).
   * \param stride The interval between channels to include
   */
  void add_channel_slice(const std::string& name, const std::string& input,
                         int start_index, int end_index, size_t stride);
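
  // Example (illustrative sketch): keep every channel except the last one of a
  // hypothetical input "scores" (end_index == -1 resolves to n - 1):
  //
  //   spec.add_channel_slice("scores_but_last", "scores", /*start_index=*/0,
  //                          /*end_index=*/-1, /*stride=*/1);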

  /**
   * Appends an LSTM layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param hidden_input The name of the initial hidden state
   * \param cell_input The name of the initial cell state
   * \param hidden_output The name of the resulting hidden state
   * \param cell_output The name of the resulting cell state
   * \param input_vector_size The size of the input vector
   * \param output_vector_size The size of the output vector (hidden state and
   *        cell state)
   * \param cell_clip_threshold Maximum magnitude of cell state values
   * \param initializers LSTM weights
   */
  void add_lstm(const std::string& name, const std::string& input,
                const std::string& hidden_input, const std::string& cell_input,
                const std::string& hidden_output,
                const std::string& cell_output, size_t input_vector_size,
                size_t output_vector_size, float cell_clip_threshold,
                const lstm_weight_initializers& initializers);

  // TODO: Support additional layers (and further parameterize the above) as
  // needed. If/when we support the full range of NeuralNetworkLayer values,
  // this could be shared in some form with coremltools.

  /**
   * Appends a preprocessing layer. Currently only image-scaling preprocessing
   * is supported.
   *
   * \param feature_name The name of the image feature to preprocess
   * \param image_scale Scale factor applied to each pixel value
   */
  void add_preprocessing(const std::string& feature_name,
                         const float image_scale);
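
  // Example (illustrative sketch): scale 0-255 pixel values into [0, 1] for a
  // hypothetical input feature named "image":
  //
  //   spec.add_preprocessing("image", 1.0f / 255.0f);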

  /**
   * Appends a Transpose layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param axes The ordering of the axes to transpose; for instance, {0, 2, 1, 3}
   *        would swap the channel and height axes
   */
  void add_transpose(const std::string& name, const std::string& input,
                     std::vector<size_t> axes);

  /**
   * Appends a Split layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param axis The axis to split the layer on
   * \param num_splits The number of splits to perform
   * \param split_sizes The size of each split
   */
  void add_split_nd(const std::string& name, const std::string& input,
                    size_t axis, size_t num_splits,
                    const std::vector<size_t>& split_sizes);

  /**
   * Appends a Concat layer.
   *
   * \param name The name of the layer and its output
   * \param inputs The vector of names of the layer's inputs
   * \param axis The axis to concat the layer on
   */
  void add_concat_nd(const std::string& name,
                     const std::vector<std::string>& inputs, size_t axis);

  /**
   * Appends a Reshape Static layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param targetShape The target shape
   */
  void add_reshape_static(const std::string& name, const std::string& input,
                          const std::vector<size_t>& targetShape);

  /**
   * Appends a Reshape Dynamic layer.
   *
   * \param name The name of the layer and its output
   * \param inputs The vector of names of the layer's inputs
   */
  void add_reshape_dynamic(const std::string& name,
                           const std::vector<std::string>& inputs);

  /**
   * Appends an Expand Dims layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param axes The axes to expand the layer on
   */
  void add_expand_dims(const std::string& name, const std::string& input,
                       const std::vector<size_t>& axes,
                       const std::vector<size_t>& inputVector,
                       const std::vector<size_t>& outputVector);

  /**
   * Appends a Squeeze layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   * \param axes The axes to squeeze the layer on
   */
  void add_squeeze(const std::string& name, const std::string& input,
                   const std::vector<size_t>& axes,
                   const std::vector<size_t>& inputVector,
                   const std::vector<size_t>& outputVector);

  /**
   * Appends an Add Broadcastable layer.
   *
   * \param name The name of the layer and its output
   * \param inputs The vector of names of the layer's inputs
   */
  void add_add_broadcastable(const std::string& name,
                             const std::vector<std::string>& inputs);

  /**
   * Appends a Gather layer.
   *
   * \param name The name of the layer and its output
   * \param inputs The vector of names of the layer's inputs
   */
  void add_gather(const std::string& name,
                  const std::vector<std::string>& inputs);

  /**
   * Appends a Constant ND layer.
   *
   * \param name The name of the layer and its output
   * \param shape The shape of the constant layer
   * \param data The data being loaded in the constant layer
   */
  void add_constant_nd(const std::string& name,
                       const std::vector<size_t>& shape,
                       const weight_initializer& data);

  /**
   * Appends a Get Shape layer.
   *
   * \param name The name of the layer and its output
   * \param input The name of the layer's input
   */
  void add_get_shape(const std::string& name, const std::string& input);

  /**
   * Appends a dynamic slicing layer.
   *
   * \param name The name of the layer and its output
   * \param inputs The names of the layer's inputs
   */
  void add_slice_dynamic(const std::string& name, const std::vector<std::string>& inputs);

  /**
   * Appends a non-maximum suppression layer.
   *
   * \param name The name of the layer and its output
   * \param inputs The names of the layer's inputs
   * \param outputs The outputs of the layer
   * \param iou_threshold The default value for the IOU threshold
   * \param confidence_threshold The default value for the confidence threshold
   * \param max_boxes The maximum number of boxes NMS may select
   * \param per_class_suppression When false, suppression happens across all
   *        classes.
   */
  void add_nms_layer(const std::string& name, const std::vector<std::string>& inputs,
                     const std::vector<std::string>& outputs, float iou_threshold,
                     float confidence_threshold, size_t max_boxes, bool per_class_suppression);
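
  // Example (illustrative sketch; the input/output names and threshold values
  // are hypothetical and depend on how the surrounding network is wired):
  //
  //   spec.add_nms_layer("nms", {"raw_boxes", "raw_scores"},
  //                      {"boxes", "scores"}, /*iou_threshold=*/0.45f,
  //                      /*confidence_threshold=*/0.25f, /*max_boxes=*/64,
  //                      /*per_class_suppression=*/false);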

 private:
  std::unique_ptr<CoreML::Specification::NeuralNetwork> impl_;
};

/**
 * Simple wrapper around CoreML::Specification::Pipeline that allows client code
 * to pass around instances without importing full protobuf headers.
 *
 * \todo As needed, elaborate this class and move into its own file.
 */
class pipeline_spec {
 public:
  pipeline_spec(std::unique_ptr<CoreML::Specification::Pipeline> impl);

  pipeline_spec(pipeline_spec&&);
  pipeline_spec& operator=(pipeline_spec&&);

  // Declared here and defined in the .cpp file just to prevent the implicit
  // default destructor from attempting (and failing) to instantiate
  // std::unique_ptr<Pipeline>::~unique_ptr()
  ~pipeline_spec();

  /**
   * Exposes the underlying CoreML proto.
   */
  const CoreML::Specification::Pipeline& get_coreml_spec() const {
    return *impl_;
  }

  /**
   * Transfers ownership of the underlying CoreML proto, invalidating the
   * current instance (leaving it in a "moved-from" state).
   *
   * (Note that this method may only be invoked on a pipeline_spec&&.)
   */
  std::unique_ptr<CoreML::Specification::Pipeline> move_coreml_spec() &&;
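
  // Example (illustrative sketch; `pipeline` is a pipeline_spec built
  // elsewhere): as with model_spec, the proto can only be extracted from an
  // expiring value:
  //
  //   std::unique_ptr<CoreML::Specification::Pipeline> pipeline_proto =
  //       std::move(pipeline).move_coreml_spec();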

 private:
  std::unique_ptr<CoreML::Specification::Pipeline> impl_;
};

} // neural_net
} // turi

#endif // UNITY_TOOLKITS_NEURAL_NET_MODEL_SPEC_HPP_