iVS3D v2.0.9
Loading...
Searching...
No Matches
Tensor.h
Go to the documentation of this file.
#pragma once

#include <algorithm>
#include <array>
#include <cassert>
#include <cmath>
#include <cstdint>
#include <iostream>
#include <numeric>
#include <sstream>
#include <string>
#include <type_traits>
#include <utility>
#include <variant>
#include <vector>

#include <opencv2/core.hpp>
#include <opencv2/imgproc.hpp>

#include <tl/expected.hpp>

#include <ReduceOps.h>

#include "NeuralError.h"
54namespace NN
55{
75 using Shape = std::vector<int64_t>;
76
85 int64_t shapeNumElements(const Shape &shape);
86
94 int64_t shapeToStride(const Shape &shape, uint64_t axis);
95
102 std::string shapeToString(const Shape &shape);
103
114 enum class TensorType
115 {
116 Float, // float32
117 Int64, // int64_t
118 UInt8, // uint8_t
119 Invalid // Invalid type, used for error handling
120 };
121
128 constexpr const char *toString(TensorType type)
129 {
130 switch (type)
131 {
132 case TensorType::Float:
133 return "float32";
134 case TensorType::Int64:
135 return "int64";
136 case TensorType::UInt8:
137 return "uint8";
138 default:
139 return "Invalid";
140 }
141 };
142
143 // --- Helper to extract std::array traits
144
    // Primary template: T is not a std::array.
    template <typename T>
    struct is_std_array : std::false_type
    {
    };

    // Specialization: matches std::array<U, N> and exposes its element type and size.
    template <typename U, std::size_t N>
    struct is_std_array<std::array<U, N>> : std::true_type
    {
        using value_type = U;
        static constexpr size_t size = N;
    };

    // Remove cv/ref qualifiers and decay.
    // NOTE(review): duplicates std::decay_t — presumably kept for readability or
    // historical reasons; confirm before removing, other code may use NN::decay_t.
    template <typename T>
    using decay_t = typename std::decay<T>::type;
165
169 template <typename Func, typename InputElem>
171 {
172 using return_type = std::decay_t<std::invoke_result_t<Func, InputElem>>;
173 static_assert(is_std_array<return_type>::value, "Function must return std::array");
174
175 using value_type = typename is_std_array<return_type>::value_type;
176 static constexpr size_t size = is_std_array<return_type>::size;
177 };
    // --- End helpers
179
200 class Tensor
201 {
202 public:
203 using TensorData = std::variant<
204 std::vector<float>,
205 std::vector<int64_t>,
206 std::vector<uint8_t>>;
207
215 static tl::expected<Tensor, NeuralError> fromCvMat(const cv::Mat &mat);
216
247 static tl::expected<Tensor, NeuralError> fromCvMat(const cv::Mat &mat, const Shape &shape, float scale = 1.0f, std::vector<float> mean = {}, std::vector<float> std = {}, int gridSize = 1);
248
269 static tl::expected<Tensor, NeuralError> fromCvMats(const std::vector<cv::Mat> &mats);
270
296 static tl::expected<Tensor, NeuralError> fromCvMats(const std::vector<cv::Mat> &mats, const Shape &shape, float scale = 1.0f, std::vector<float> mean = {}, std::vector<float> std = {}, int gridSize = 1);
297
312 template <typename T>
313 static tl::expected<Tensor, NeuralError> fromData(const std::vector<T> &data, const Shape &shape)
314 {
315 return fromData(std::vector<T>(data), shape); // delegates to move overload
316 }
317
342 template <typename T>
343 static tl::expected<Tensor, NeuralError> fromData(std::vector<T> &&data, const Shape &shape)
344 {
345 if (static_cast<size_t>(shapeNumElements(shape)) != data.size())
346 {
347 return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Data size does not match shape"));
348 }
349
350 Tensor t;
351 t.m_shape = shape;
352 t.m_data = std::move(data);
353 return t;
354 }
355
385 template <typename T>
386 tl::expected<std::vector<T>, NeuralError> toVector() const
387 {
388 if (std::holds_alternative<std::vector<T>>(m_data))
389 {
390 return std::get<std::vector<T>>(m_data);
391 }
392 return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Tensor does not hold requested data type"));
393 }
394
401 tl::expected<cv::Mat, NeuralError> toCvMat() const;
402
        /// Readonly access to the tensor's shape (size per dimension).
        const Shape &shape() const { return m_shape; }
409
415 std::string toString() const;
416
423 tl::expected<void, NeuralError> reshape(const Shape &newShape);
424
430 int64_t numElements() const;
431
438 bool empty() const
439 {
440 return m_shape.empty() || shapeNumElements(m_shape) == 0;
441 }
442
450 {
451 return std::visit([](const auto &vec) -> TensorType
452 {
453 using T = typename std::decay_t<decltype(vec)>::value_type;
454 if constexpr (std::is_same_v<T, float>) {
455 return TensorType::Float;
456 } else if constexpr (std::is_same_v<T, int64_t>) {
457 return TensorType::Int64;
458 } else if constexpr (std::is_same_v<T, uint8_t>) {
459 return TensorType::UInt8;
460 } else {
461 return TensorType::Invalid; // Unsupported type
462 } }, m_data);
463 };
464
485 template <typename Op>
486 tl::expected<Tensor, NeuralError> reduce(const Op &op, uint64_t axis) const
487 {
488 if (axis >= m_shape.size())
489 {
490 return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Invalid reduction axis"));
491 }
492
493 return std::visit([&](const auto &inputVec) -> tl::expected<Tensor, NeuralError>
494 {
495 using T = typename std::decay_t<decltype(inputVec)>::value_type;
496 const int64_t D = m_shape.size();
497
498 Shape outShape = m_shape;
499 outShape[axis] = 1;
500
501 std::vector<T> output(shapeNumElements(outShape));
502
503 int64_t innerStride = shapeToStride(m_shape, axis);
504 int64_t dimSize = m_shape[axis];
505 int64_t outerStride = innerStride * dimSize;
506
507 for (int64_t offset = 0; offset < inputVec.size(); offset += outerStride) {
508 for (int64_t i = 0; i < innerStride; ++i) {
509 // Compute flat index
510 int64_t outIdx = (offset / outerStride) * innerStride + i;
511 // Initialize accumulator
512 T acc = op.template initial<T>();
513 for (int64_t d = 0; d < dimSize; ++d) {
514 int64_t idx = offset + d * innerStride + i;
515 op(acc, inputVec[idx]); // Apply operation
516 }
517 output[outIdx] = acc;
518 }
519 }
520 return Tensor::fromData(std::move(output), outShape); }, m_data);
521 }
522
553 template <typename Op>
554 tl::expected<Tensor, NeuralError> reduceWithIndex(const Op &op, uint64_t axis) const
555 {
556 if (axis >= m_shape.size())
557 {
558 return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Invalid reduction axis"));
559 }
560
561 return std::visit([&](const auto &inputVec) -> tl::expected<Tensor, NeuralError>
562 {
563 using T = typename std::decay_t<decltype(inputVec)>::value_type;
564
565 Shape outShape = m_shape;
566 outShape[axis] = 1;
567
568 std::vector<int64_t> output(shapeNumElements(outShape));
569
570 int64_t innerStride = shapeToStride(m_shape, axis);
571 int64_t dimSize = m_shape[axis];
572 int64_t outerStride = innerStride * dimSize;
573
574 for (int64_t offset = 0; offset < inputVec.size(); offset += outerStride) {
575 for (int64_t i = 0; i < innerStride; ++i) {
576 int64_t outIdx = (offset / outerStride) * innerStride + i;
577 auto acc = op.template initial<T>();
578 for (size_t d = 0; d < dimSize; ++d) {
579 size_t idx = offset + d * innerStride + i;
580 op(acc, inputVec[idx], d);
581 }
582 output[outIdx] = static_cast<int64_t>(acc.first);
583 }
584 }
585
586 return Tensor::fromData(std::move(output), outShape); }, m_data);
587 }
588
617 template <typename Func>
618 tl::expected<Tensor, NeuralError> map(Func &&f) const
619 {
620 return std::visit([&](const auto &inputVec) -> tl::expected<Tensor, NeuralError>
621 {
622 using T = typename std::decay_t<decltype(inputVec)>::value_type;
623 using V = std::decay_t<decltype(f(std::declval<T>()))>;
624
625 std::vector<V> output;
626 output.resize(inputVec.size());
627
628 std::transform(inputVec.begin(), inputVec.end(), output.begin(),
629 [&](const T &val) -> V
630 {
631 return f(val);
632 });
633
634 return Tensor::fromData(std::move(output), m_shape); },
635 m_data);
636 }
637
        /**
         * @brief Map each element to a std::array of values, inserting a new axis of
         *        that array's length at position `axis`.
         *
         * `func` must return std::array<U, N> (enforced by map_array_traits); the
         * result tensor has element type U and the original shape with N inserted
         * at `axis`.
         * @param func callable T -> std::array<U, N>
         * @param axis position of the new dimension; axis == rank appends at the end
         * @return the mapped Tensor, or NeuralError on invalid axis / empty data
         */
        template <typename Func>
        tl::expected<Tensor, NeuralError> map(Func &&func, int axis) const
        {
            // Sanity check axis (axis == rank is valid: append the new dimension).
            if (axis < 0 || axis > static_cast<int>(m_shape.size()))
            {
                return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Invalid axis to insert new dimension."));
            }

            return std::visit([&](const auto &input) -> tl::expected<Tensor, NeuralError>
                {
                using T = typename std::decay_t<decltype(input)>::value_type;
                using Traits = map_array_traits<Func, T>;
                using U = typename Traits::value_type;
                constexpr size_t N = Traits::size;

                if (input.empty()) {
                    return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Tensor data is empty."));
                }

                // Compute the original and new shapes
                Shape newShape = m_shape;
                newShape.insert(newShape.begin() + axis, N);

                const int64_t oldSize = shapeNumElements(m_shape);
                const int64_t newSize = oldSize * N;

                std::vector<U> outData(newSize);

                // Precompute strides for flat <-> coordinate conversions.
                std::vector<int64_t> oldStrides = computeStrides(m_shape);
                std::vector<int64_t> newStrides = computeStrides(newShape);


                // Main loop: for each index in the old tensor, place mapped values in the new buffer
                for (int64_t idx = 0; idx < oldSize; ++idx) {
                    // Convert flat idx to N-dimensional index
                    std::vector<int64_t> coord = unravelIndex(idx, oldStrides);

                    // Apply function to get array<U, N>
                    auto mapped = func(input[idx]);

                    // Insert mapped[N] into new buffer at axis:
                    // widen the coordinate with a placeholder at `axis`, then
                    // scatter the N mapped values along the new dimension.
                    coord.insert(coord.begin() + axis, 0);
                    for (int64_t i = 0; i < static_cast<int64_t>(N); ++i) {
                        coord[axis] = i;
                        int64_t flatIdx = ravelIndex(coord, newStrides);
                        outData[flatIdx] = mapped[i];
                    }
                }

                return Tensor::fromData(std::move(outData), newShape); }, m_data);
        }
721
727 tl::expected<void, NeuralError> squeeze();
728
734 tl::expected<void, NeuralError> squeeze(int64_t axis);
735
741 tl::expected<void, NeuralError> unsqueeze(int64_t axis);
742
743 private:
744 TensorData m_data;
745 Shape m_shape;
746
747 static inline std::vector<int64_t> computeStrides(const Shape &shape)
748 {
749 std::vector<int64_t> strides(shape.size(), 1);
750 for (int i = shape.size() - 2; i >= 0; --i)
751 strides[i] = strides[i + 1] * shape[i + 1];
752 return strides;
753 }
754
755 static inline std::vector<int64_t> unravelIndex(int64_t index, const std::vector<int64_t> &strides)
756 {
757 std::vector<int64_t> coords(strides.size());
758 for (size_t i = 0; i < strides.size(); ++i)
759 {
760 coords[i] = index / strides[i];
761 index %= strides[i];
762 }
763 return coords;
764 }
765
766 static inline int64_t ravelIndex(const std::vector<int64_t> &coords, const std::vector<int64_t> &strides)
767 {
768 int64_t index = 0;
769 for (size_t i = 0; i < coords.size(); ++i)
770 index += coords[i] * strides[i];
771 return index;
772 }
773
        /**
         * @brief Build an NCHW Tensor of element type T from a batch of cv::Mat.
         *
         * All mats must share depth CV_TYPE, size and channel count. Each mat's
         * interleaved channels are split so the output is [batch][channel][row][col].
         * @tparam T       element type matching CV_TYPE (e.g. float for CV_32F)
         * @tparam CV_TYPE expected OpenCV depth of every input mat
         * @param mats non-empty vector of equally-shaped mats
         * @return the packed Tensor, or NeuralError on empty input / mismatched mats
         */
        template <typename T, int CV_TYPE>
        static tl::expected<Tensor, NeuralError> fromCvMatsTyped(const std::vector<cv::Mat> &mats)
        {
            if (mats.empty())
            {
                return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "Input vector of cv::Mat is empty"));
            }

            // The first mat defines the expected geometry for the whole batch.
            int channels = mats[0].channels();
            int height = mats[0].rows;
            int width = mats[0].cols;

            // NCHW layout: [batch, channels, height, width].
            Shape shape = {static_cast<int64_t>(mats.size()), static_cast<int64_t>(channels), static_cast<int64_t>(height), static_cast<int64_t>(width)};
            auto totalSize = shapeNumElements(shape);

            std::vector<T> data;
            data.reserve(totalSize);

            for (const auto &mat : mats)
            {
                if (mat.depth() != CV_TYPE)
                {
                    return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "All cv::Mat must have the same data type"));
                }

                if (mat.channels() != channels || mat.rows != height || mat.cols != width)
                {
                    return tl::unexpected(NeuralError(ErrorCode::InvalidArgument, "All cv::Mat must have the same size and number of channels"));
                }

                // Split interleaved HWC data into per-channel planes.
                std::vector<cv::Mat> splitted;
                cv::split(mat, splitted);

                for (int c = 0; c < channels; ++c)
                {
                    // data.insert(data.end(), splitted[c].datastart, splitted[c].dataend);
                    // NOTE(review): the flat height*width copy assumes each split
                    // plane is continuous — true for freshly allocated planes,
                    // but worth confirming.
                    const T *channelData = splitted[c].ptr<T>();
                    data.insert(data.end(), channelData, channelData + height * width);
                }
            }

            return fromData(std::move(data), shape);
        }
825
        /**
         * @brief Basic preprocessing: BGR->RGB conversion, optional resize, and
         *        conversion to CV_32F with a scale factor.
         * @param mat      input image (OpenCV BGR order when 3-channel)
         * @param shape    target shape; its last two entries select the target size,
         *                 (-1, -1) meaning dynamic (no fixed resize)
         * @param scale    factor applied during the float conversion
         * @param gridSize if > 1 and the size is dynamic, round the size up to the
         *                 next multiple of gridSize
         * @return the preprocessed CV_32F mat
         */
        static cv::Mat preprocessCvMat(const cv::Mat &mat, const Shape &shape, float scale, int gridSize)
        {
            cv::Mat tmp;
            const cv::Mat *matPtr = &mat; // points to the mat were currently working with

            // if 3d, swap red and blue channels from BGR (opencv-standard) to RGB (anything else)
            if (mat.channels() == 3)
            {
                cv::cvtColor(*matPtr, tmp, cv::COLOR_BGR2RGB);
                matPtr = &tmp;
            }

            // resize if necessary
            // NOTE(review): cv::Size is (width, height), but shape[n-2]/shape[n-1]
            // would be (height, width) for NCHW — this looks swapped for non-square
            // targets; confirm the intended shape layout.
            cv::Size size(shape[shape.size() - 2], shape[shape.size() - 1]);

            // a specific size is requested in the shape and the image does not match this yet
            if (size == cv::Size(-1,-1)) {
                // size is dynamic, so we do not resize here, unless a gridSize > 1 is requested
                if (gridSize > 1) {
                    // Round both dimensions up to the next multiple of gridSize.
                    cv::Size newSize(
                        ((matPtr->cols + gridSize - 1) / gridSize) * gridSize,
                        ((matPtr->rows + gridSize - 1) / gridSize) * gridSize);
                    // NOTE(review): src and dst may alias the same Mat here
                    // (matPtr == &tmp after cvtColor) — OpenCV reallocates dst,
                    // but confirm this is intended.
                    cv::resize(*matPtr, tmp, newSize, 0, 0, cv::INTER_AREA);
                    matPtr = &tmp;
                }
            }
            else {
                // size is static, so we resize to the requested size
                if (size != matPtr->size())
                {
                    cv::resize(*matPtr, tmp, size, 0, 0, cv::INTER_AREA);
                    matPtr = &tmp;
                }
            }


            // convert to float and apply scale
            matPtr->convertTo(tmp, CV_32F, scale);
            return tmp;
        }
869
873 static cv::Mat preprocessCvMat(const cv::Mat &mat, const Shape &shape, float scale, const std::vector<float> &mean, const std::vector<float> &std, int gridSize)
874 {
875 cv::Mat tmp = preprocessCvMat(mat, shape, scale, gridSize); // first do the basic preprocessing
876
877 // check if mean and std are provided and have the correct size
878 assert(mean.size() == tmp.channels());
879 assert(std.size() == tmp.channels());
880 // check that std is not zero
881 assert(std::all_of(std.begin(), std.end(), [](float s) { return s != 0.0f; }));
882
883 // subtract mean from each channel
884 int channels = tmp.channels();
885 int rows = tmp.rows;
886 int cols = tmp.cols * channels;
887
888 if (tmp.isContinuous())
889 {
890 cols *= rows;
891 rows = 1;
892 }
893
894 for (int i = 0; i < rows; ++i)
895 {
896 float *ptr = tmp.ptr<float>(i);
897 for (int j = 0; j < cols; j += channels)
898 {
899 for (int c = 0; c < channels; ++c)
900 {
901 ptr[j + c] = (ptr[j + c] - mean[c]) / std[c]; // apply mean and std
902 }
903 }
904 }
905
906 return tmp;
907 }
908
909 friend class OrtNeuralNet;
910 };
911}
912
#ifndef TENSOR_DEBUG_PRINT
#ifdef NDEBUG
// Release: expands to a no-op expression; the caller supplies the ';'.
#define TENSOR_DEBUG_PRINT(tensor) ((void)0)
#else
#include <iostream>
// Debug: print the tensor's string representation.
// No trailing ';' inside the macro — the original's embedded semicolon made
// `if (x) TENSOR_DEBUG_PRINT(t); else ...` a syntax error.
#define TENSOR_DEBUG_PRINT(tensor) (std::cout << (tensor).toString() << std::endl)
#endif
#endif
921
#ifndef SHAPE_DEBUG_PRINT
#ifdef NDEBUG
// Release: expands to a no-op expression; the caller supplies the ';'.
#define SHAPE_DEBUG_PRINT(shape) ((void)0)
#else
#include <iostream>
// Debug: print the shape via NN::shapeToString.
// No trailing ';' inside the macro — keeps `if (x) SHAPE_DEBUG_PRINT(s); else`
// well-formed and avoids double semicolons at call sites.
#define SHAPE_DEBUG_PRINT(shape) (std::cout << NN::shapeToString(shape) << std::endl)
#endif
#endif
930
#ifndef RETURN_ON_ERROR
// Evaluate `expr` (any expected-like type with operator bool and .error());
// on failure, log the error to stderr and return `retVal` from the enclosing
// function. The do/while(0) has NO trailing ';' — the whole point of the idiom
// is that the caller's ';' completes the statement, keeping if/else usage valid
// (the original's `while (0);` defeated this).
#define RETURN_ON_ERROR(expr, retVal)                            \
    do                                                           \
    {                                                            \
        auto _res = (expr);                                      \
        if (!_res)                                               \
        {                                                        \
            std::cerr << "Error: " << _res.error() << std::endl; \
            return (retVal);                                     \
        }                                                        \
    } while (0)
#endif
Defines error handling classes for the neural network module.
Contains reduction operations for tensors such as sum, min, max, argmin, and argmax.
Represents an error that occurred in the neural network module and contains the error type and messag...
Definition NeuralError.h:48
A class that implements the NeuralNet interface using ONNX Runtime.
Definition OrtNeuralNet.h:58
A Tensor represents a N-dimensional array containing elements of the same type. Can be used as input ...
Definition Tensor.h:201
static tl::expected< Tensor, NeuralError > fromCvMats(const std::vector< cv::Mat > &mats)
Create a new Tensor object from a vector of cv::Mat objects. The cv::Mat objects must have the same s...
Definition Tensor.cpp:164
tl::expected< Tensor, NeuralError > reduceWithIndex(const Op &op, uint64_t axis) const
Reduce the Tensor along a given axis by applying an accumulative operation. The dimension in the reduc...
Definition Tensor.h:554
const Shape & shape() const
Readonly access to the shape of the tensor. Valid tensors ensure the shape is static,...
Definition Tensor.h:408
static cv::Mat preprocessCvMat(const cv::Mat &mat, const Shape &shape, float scale, int gridSize)
Preprocess a cv::Mat to match the given shape by resizing, color conversion from BGR to RGB,...
Definition Tensor.h:829
bool empty() const
Check if the tensor is empty, so to say it contains no elements.
Definition Tensor.h:438
tl::expected< Tensor, NeuralError > reduce(const Op &op, uint64_t axis) const
Reduce the Tensor along a given axis by applying an accumulative operation.
Definition Tensor.h:486
static tl::expected< Tensor, NeuralError > fromData(const std::vector< T > &data, const Shape &shape)
Create a new Tensor object from a given data vector and shape. The number of elements in the vector m...
Definition Tensor.h:313
tl::expected< void, NeuralError > squeeze()
Squeeze the Tensor by removing dimensions of size 1. This operation is performed inplace.
Definition Tensor.cpp:394
tl::expected< cv::Mat, NeuralError > toCvMat() const
Create a cv::Mat from a Tensor. In case of 2/3 dimensions this will convert back to CVs HWC layout....
Definition Tensor.cpp:255
static cv::Mat preprocessCvMat(const cv::Mat &mat, const Shape &shape, float scale, const std::vector< float > &mean, const std::vector< float > &std, int gridSize)
Preprocess a cv::Mat to match the given shape by resizing, color conversion from BGR to RGB,...
Definition Tensor.h:873
TensorType dtype() const
Check the data type of the Tensor. This is deduced from the data type of the contained elements.
Definition Tensor.h:449
static tl::expected< Tensor, NeuralError > fromCvMat(const cv::Mat &mat)
Create a new Tensor object from a cv::Mat. This will convert from CVs HWC layout to ONNX standard lay...
Definition Tensor.cpp:6
tl::expected< std::vector< T >, NeuralError > toVector() const
Create a vector containing the data from the Tensor.
Definition Tensor.h:386
std::string toString() const
Create a human-readable string representation containing the Tensors shape and data type.
Definition Tensor.cpp:238
static tl::expected< Tensor, NeuralError > fromData(std::vector< T > &&data, const Shape &shape)
Create a new Tensor object from a given data vector and shape. The number of elements in the vector m...
Definition Tensor.h:343
tl::expected< Tensor, NeuralError > map(Func &&func, int axis) const
Map each element of the Tensor to an array of new values by applying a given function element-wise....
Definition Tensor.h:669
tl::expected< Tensor, NeuralError > map(Func &&f) const
Map each element of the Tensor to a new value by applying a given function element-wise....
Definition Tensor.h:618
tl::expected< void, NeuralError > unsqueeze(int64_t axis)
Add a new dimension of size 1 at the specified axis.
Definition Tensor.cpp:412
int64_t numElements() const
Returns the number of elements contained in the Tensor.
Definition Tensor.cpp:361
static tl::expected< Tensor, NeuralError > fromCvMatsTyped(const std::vector< cv::Mat > &mats)
Create a new Tensor object from a vector of cv::Mat objects with a specific type.
Definition Tensor.h:783
tl::expected< void, NeuralError > reshape(const Shape &newShape)
Reshape will interprete the data elements contained in the Tensor as a different shape....
Definition Tensor.cpp:331
TensorType
TensorType encapsulates the supported data types of tensor elements. The supported types are:
Definition Tensor.h:115
std::vector< int64_t > Shape
Shape of a N-dimensional Tensor represented as the size in each dimension. Can be -1 in case of dynam...
Definition Tensor.h:75
NN Neural Network Library containing Tensor and NeuralNet classes for inference.
Definition NeuralError.h:13
int64_t shapeNumElements(const Shape &shape)
Calculates the number of elements from a given Shape.
Definition Tensor.cpp:366
constexpr const char * toString(TensorType type)
Convert the TensorType to a human-readable string.
Definition Tensor.h:128
typename std::decay< T >::type decay_t
Remove cv/ref qualifiers and decay to check std::array<T, N>
Definition Tensor.h:164
std::string shapeToString(const Shape &shape)
Creates a human-readable string from the given shape.
Definition Tensor.cpp:371
int64_t shapeToStride(const Shape &shape, uint64_t axis)
Calculates the stride to iterate elements in a given axis.
Definition Tensor.cpp:385
Checks if a type is a std::array.
Definition Tensor.h:150
Traits for mapping a function over a std::array.
Definition Tensor.h:171