theoretica/dataset_8h_source.html

#ifndef THEORETICA_DATASET_H

#define THEORETICA_DATASET_H


#ifndef THEORETICA_NO_PRINT

#include <sstream>

#include <ostream>

#endif


#include "./core_traits.h"

#include "./constants.h"

#include "./error.h"


namespace theoretica {


    // Operations on datasets and generic ordered sets of numbers

    // The Vector type must have size() and operator[]() methods

    // (e.g. std::vector<real> and vec<real>)


    /// Compute the product of all the elements of a set of values.
    ///
    /// @param X The vector of values (must provide size() and operator[])
    /// @return The product of the elements of X. If X is empty,
    /// TH_MATH_ERROR is invoked with INVALID_ARGUMENT and NaN,
    /// converted to the element type, is returned.
    template<typename Vector, enable_vector<Vector> = true>
    inline auto product(const Vector& X) {

        // Without a first element there is nothing to start from
        if(X.size() == 0) {
            TH_MATH_ERROR("product", X.size(), INVALID_ARGUMENT);
            return vector_element_t<Vector>(nan());
        }

        auto prod = X[0];
        unsigned int k = 1;

        // Fold the remaining elements into the running product
        while(k < X.size()) {
            prod *= X[k];
            k++;
        }

        return prod;
    }


    template<typename Vector>


    inline auto product_sum(const Vector& X, const Vector& Y) {


        if(X.size() != Y.size() || !X.size()) {

            TH_MATH_ERROR("product_sum", X.size(), INVALID_ARGUMENT);

            return nan();

        }


        auto res = X[0] * Y[0];

        for(unsigned int i = 1; i < X.size(); i++)

            res += X[i] * Y[i];


        return res;

    }


    template<typename Vector>


    inline auto product_sum_squares(const Vector& X, const Vector& Y) {


        if(X.size() != Y.size() || !X.size()) {

            TH_MATH_ERROR("product_sum_squares", X.size(), INVALID_ARGUMENT);

            return nan();

        }


        auto res = (X[0] * X[0]) * (Y[0] * Y[0]);


        for(unsigned int i = 1; i < X.size(); i++)

            res += (X[i] * X[i]) * (Y[i] * Y[i]);


        return res;

    }


    template<typename Vector>


    inline auto product_sum(const Vector& X, const Vector& Y, const Vector& Z) {


        if(X.size() != Y.size() || X.size() != Z.size() || !X.size()) {

            TH_MATH_ERROR("product_sum", X.size(), INVALID_ARGUMENT);

            return nan();

        }


        auto res = X[0] * Y[0] * Z[0];

        for(unsigned int i = 1; i < X.size(); i++)

            res += X[i] * Y[i] * Z[i];


        return res;

    }


    template<typename Vector>


    inline auto quotient_sum(const Vector& X, const Vector& Y) {


        if(X.size() != Y.size()) {

            TH_MATH_ERROR("quotient_sum", X.size(), INVALID_ARGUMENT);

            return nan();

        }


        if(abs(Y[0]) < MACH_EPSILON) {

            TH_MATH_ERROR("quotient_sum", Y[0], DIV_BY_ZERO);

            return nan();

        }


        auto res = X[0] / Y[0];

        for(unsigned int i = 1; i < X.size(); i++) {


            if(abs(Y[i]) < MACH_EPSILON) {

                TH_MATH_ERROR("quotient_sum", Y[i], DIV_BY_ZERO);

                return nan();

            }


            res += X[i] / Y[i];

        }


        return res;

    }


    template<typename Vector>


    inline auto sum_squares(const Vector& X) {


        if(!X.size()) {

            TH_MATH_ERROR("sum_squares", X.size(), INVALID_ARGUMENT);

            return nan();

        }


        auto res = X[0] * X[0];

        for(unsigned int i = 1; i < X.size(); i++)

            res += X[i] * X[i];


        return res;

    }


    /// Compute the sum of a set of values while tracking, in a separate
    /// correction term, the low-order bits which are lost by each
    /// floating point addition.
    ///
    /// @param X The vector of values
    /// @return The running sum plus the accumulated correction
    /// (zero for an empty vector)
    template<typename Vector>
    inline real sum_compensated(const Vector& X) {

        // Running total and accumulated rounding correction
        real sum = 0;
        real corr = 0;

        unsigned int k = 0;

        while(k < X.size()) {

            const real temp = sum + X[k];

            // Recover the bits lost by the addition, always starting
            // from the addend with the larger magnitude
            if(abs(sum) >= abs(X[k]))
                corr += ((sum - temp) + X[k]);
            else
                corr += ((X[k] - temp) + sum);

            sum = temp;
            k++;
        }

        // The correction is applied only once, at the very end
        return sum + corr;
    }


    /// Compute the sum of a range of values using pairwise summation:
    /// the range is recursively split in two halves which are summed
    /// separately, down to ranges of at most base_size elements which
    /// are summed directly.
    ///
    /// @param X The vector of values
    /// @param begin The index of the first element to sum (defaults to 0)
    /// @param end One past the index of the last element to sum;
    /// 0 (the default) stands for X.size()
    /// @param base_size The largest range which is summed directly
    /// (defaults to 128); a value of 0 is treated as 1
    /// @return The sum of the elements in [begin, end),
    /// or 0 if the range is empty or inverted
    template<typename Vector>
    inline real sum_pairwise(
        const Vector& X, size_t begin = 0,
        size_t end = 0, size_t base_size = 128) {

        // end == 0 is the sentinel for "up to the last element"
        if(end == 0)
            end = X.size();

        // Nothing to sum. This also keeps the unsigned subtraction
        // below from wrapping around when begin > end.
        if(begin >= end)
            return 0;

        // With a base size of zero a single-element range would be split
        // into an empty half and itself, recursing without end.
        if(base_size == 0)
            base_size = 1;

        const size_t length = end - begin;

        // Base case with given size (defaults to 128)
        if(length <= base_size) {

            real sum = 0;

            for (size_t i = begin; i < end; ++i)
                sum += X[i];

            return sum;
        }

        // Recursive sum of two halves. Here length >= 2, so the cutoff
        // lies strictly between begin and end and is never 0, which
        // would be mistaken for the sentinel value of end.
        const size_t cutoff = begin + length / 2;

        return sum_pairwise(X, begin, cutoff, base_size)
            + sum_pairwise(X, cutoff, end, base_size);
    }


    // Overload of sum() constrained on has_real_elements<Vector>, which
    // forwards to sum_pairwise() with its default arguments.
    //
    // NOTE(review): std::enable_if_t with a single argument names void
    // when the condition holds, and a non-type template parameter cannot
    // have type void, so this overload looks like it is never selected
    // and every call ends up in the unconstrained sum() overload of this
    // file. Confirm the intent before "fixing" the condition: a viable
    // overload here would compete with that unconstrained sum() for
    // real-valued vectors.
    template <

        typename Vector,

        std::enable_if_t<has_real_elements<Vector>::value> = true

    >


    inline auto sum(const Vector& X) {

        return sum_pairwise(X);

    }


    /// Compute the sum of a set of values.
    ///
    /// When has_real_elements<Vector>() holds, the sum is computed by
    /// sum_pairwise(); otherwise the elements are added up in order,
    /// starting from X[0]. On that second path X[0] is read
    /// unconditionally, so X must not be empty.
    ///
    /// @param X The vector of values
    /// @return The sum of the elements of X
    template<typename Vector>
    inline auto sum(const Vector& X) {

        // Real-valued data goes through pairwise summation,
        // which reduces floating point errors.
        if TH_CONSTIF (has_real_elements<Vector>())
            return sum_pairwise(X);

        auto total = X[0];
        unsigned int k = 1;

        while(k < X.size()) {
            total += X[k];
            k++;
        }

        return total;
    }


    /// Apply a function to a set of values element-wise, in place.
    ///
    /// @param f The function to apply; each element X[i] is replaced
    /// by f(X[i])
    /// @param X The vector of values, which is overwritten
    /// @return A reference to the modified vector X
    template<typename Vector, typename Function>
    inline Vector& apply(Function f, Vector& X) {

        unsigned int k = 0;

        while(k < X.size()) {
            X[k] = f(X[k]);
            k++;
        }

        return X;
    }


    template<typename Vector1, typename Vector2 = Vector1, typename Function>


    inline Vector2& map(Function f, const Vector1& src, Vector2& dest) {


        if(src.size() != dest.size()) {

            TH_MATH_ERROR("th::map", dest.size(), INVALID_ARGUMENT);

            dest = Vector2(nan());

            return dest;

        }


        for (unsigned int i = 0; i < src.size(); i++)

            dest[i] = f(src[i]);


        return dest;

    }


    /// Build a new vector by applying a function element-wise to a set
    /// of values. The result type Vector2 must be default constructible
    /// and provide resize().
    ///
    /// @param f The function to apply to each element of X
    /// @param X The vector of input values
    /// @return A vector of type Vector2 with the same size as X,
    /// holding f(X[i]) at each index i
    template<typename Vector2, typename Vector1, typename Function>
    inline Vector2 map(Function f, const Vector1& X) {

        Vector2 mapped;
        mapped.resize(X.size());

        unsigned int k = 0;

        while(k < X.size()) {
            mapped[k] = f(X[k]);
            k++;
        }

        return mapped;
    }


    // Convenience overload of map() for the case where the result has
    // the same type as the input: forwards to the map() overload taking
    // three template arguments, with both vector types set to Vector.
    //
    // f: the function to apply to each element of X
    // X: the vector of input values
    // Returns whatever that overload returns for (f, X).
    template<typename Vector, typename Function>


    inline Vector map(Function f, const Vector& X) {

        return map<Vector, Vector, Function>(f, X);

    }


    /// Concatenate two sets of values into a single one. The result
    /// type Vector3 (by default Vector1) must be default constructible
    /// and provide resize().
    ///
    /// @param v1 The vector whose elements come first
    /// @param v2 The vector whose elements follow those of v1
    /// @return A vector of size v1.size() + v2.size() holding the
    /// elements of v1 followed by the elements of v2
    template<typename Vector1, typename Vector2, typename Vector3 = Vector1>
    inline Vector3 concatenate(const Vector1& v1, const Vector2& v2) {

        // The elements of v2 are written starting from this index
        const unsigned int offset = v1.size();

        Vector3 joined;
        joined.resize(v1.size() + v2.size());

        unsigned int k = 0;

        while(k < offset) {
            joined[k] = v1[k];
            ++k;
        }

        unsigned int j = 0;

        while(j < v2.size()) {
            joined[j + offset] = v2[j];
            ++j;
        }

        return joined;
    }


    /// Find the maximum value inside a set of values.
    ///
    /// @param X The vector of values
    /// @return The first element which no later element is greater
    /// than, according to operator>. If X is empty, TH_MATH_ERROR is
    /// invoked with INVALID_ARGUMENT and NaN, converted to the
    /// element type, is returned.
    template<typename Vector>
    inline auto max(const Vector& X) {

        using Type = vector_element_t<Vector>;

        if(X.size() == 0) {
            TH_MATH_ERROR("max", X.size(), INVALID_ARGUMENT);
            return Type(nan());
        }

        // Best candidate found so far
        auto largest = X[0];
        unsigned int k = 1;

        while(k < X.size()) {

            if(X[k] > largest)
                largest = X[k];

            ++k;
        }

        return largest;
    }


    /// Find the minimum value inside a set of values.
    ///
    /// @param X The vector of values
    /// @return The first element which no later element is smaller
    /// than, according to operator<. If X is empty, TH_MATH_ERROR is
    /// invoked with INVALID_ARGUMENT and NaN, converted to the
    /// element type, is returned.
    template<typename Vector>
    inline auto min(const Vector& X) {

        using Type = vector_element_t<Vector>;

        if(X.size() == 0) {
            TH_MATH_ERROR("min", X.size(), INVALID_ARGUMENT);
            return Type(nan());
        }

        // Best candidate found so far
        auto smallest = X[0];
        unsigned int k = 1;

        while(k < X.size()) {

            if(X[k] < smallest)
                smallest = X[k];

            ++k;
        }

        return smallest;
    }


    // Different types of means


    /// Compute the arithmetic mean of a set of values,
    /// as the sum of the values divided by their number.
    ///
    /// @param data The set of values
    /// @return The arithmetic mean of the values. If the set is empty,
    /// TH_MATH_ERROR is invoked with DIV_BY_ZERO and NaN is returned.
    template<typename Dataset>
    inline real arithmetic_mean(const Dataset& data) {

        if(data.size() == 0) {
            TH_MATH_ERROR("arithmetic_mean", data.size(), DIV_BY_ZERO);
            return nan();
        }

        // Sum of x_i, then divided by N
        const auto total = sum(data);

        return total / static_cast<real>(data.size());
    }


    /// Compute the harmonic mean of a set of values, as the number
    /// of values divided by the sum of their reciprocals.
    ///
    /// @param data The set of values
    /// @return The harmonic mean of the values. If the set is empty
    /// or any value compares equal to zero, TH_MATH_ERROR is invoked
    /// with DIV_BY_ZERO and NaN is returned.
    template<typename Dataset>
    inline real harmonic_mean(const Dataset& data) {

        if(data.size() == 0) {
            TH_MATH_ERROR("harmonic_mean", data.size(), DIV_BY_ZERO);
            return nan();
        }

        // Sum of 1 / x_i
        real inverse_sum = 0;
        unsigned int k = 0;

        while(k < data.size()) {

            // The reciprocal of zero is not defined
            if(data[k] == 0) {
                TH_MATH_ERROR("harmonic_mean", data[k], DIV_BY_ZERO);
                return nan();
            }

            inverse_sum += 1.0 / data[k];
            ++k;
        }

        return static_cast<real>(data.size()) / inverse_sum;
    }


    /// Compute the geometric mean of a set of values, as the N-th root
    /// of their product, where N is the number of values.
    ///
    /// @param data The set of values
    /// @return The result of root() applied to product(data)
    /// with index data.size()
    template<typename Dataset>
    inline real geometric_mean(const Dataset& data) {

        // Product of all x_i; an empty set is reported by product()
        const auto prod = product(data);

        return root(prod, data.size());
    }


    /// Compute the weighted mean of a set of values, as the sum of
    /// the values multiplied by their weights, divided by the sum of
    /// the weights.
    ///
    /// @param data The set of values
    /// @param weights The weights of the values
    /// @return The result of product_sum(data, weights) divided
    /// by sum(weights)
    template<typename Dataset1, typename Dataset2>
    inline real weighted_mean(const Dataset1& data, const Dataset2& weights) {

        // Sum of x_i * w_i
        const auto weighted_total = product_sum(data, weights);

        // Sum of w_i
        const auto weight_total = sum(weights);

        return weighted_total / weight_total;
    }


    /// Compute the quadratic mean (Root Mean Square) of a set of
    /// values, as the square root of the mean of their squares.
    ///
    /// @param data The set of values
    /// @return The quadratic mean of the values. If the set is empty,
    /// TH_MATH_ERROR is invoked with INVALID_ARGUMENT and NaN
    /// is returned.
    template<typename Dataset>
    inline real quadratic_mean(const Dataset& data) {

        if(data.size() == 0) {
            TH_MATH_ERROR("quadratic_mean", data.size(), INVALID_ARGUMENT);
            return nan();
        }

        // Sum of x_i^2 divided by N
        const auto mean_square = sum_squares(data) / data.size();

        return sqrt(mean_square);
    }


}


#endif

constants.h
Mathematical constants and default algorithm parameters.

TH_CONSTIF
#define TH_CONSTIF
Enable constexpr in if statements if C++17 is supported.
Definition constants.h:169

core_traits.h
Fundamental type traits.

error.h
Error handling.

TH_MATH_ERROR
#define TH_MATH_ERROR(F_NAME, VALUE, EXCEPTION)
TH_MATH_ERROR is a macro which throws exceptions or modifies errno (depending on which compiling opti...
Definition error.h:225

theoretica
Main namespace of the library which contains all functions and objects.
Definition algebra.h:27

theoretica::real
double real
A real number, defined as a floating point type.
Definition constants.h:198

theoretica::weighted_mean
real weighted_mean(const Dataset1 &data, const Dataset2 &weights)
Compute the weighted mean of a set of values. <data> and <weights> must have the same size.
Definition dataset.h:423

theoretica::arithmetic_mean
real arithmetic_mean(const Dataset &data)
Compute the arithmetic mean of a set of values.
Definition dataset.h:375

theoretica::min
auto min(const Vector &X)
Finds the minimum value inside a dataset.
Definition dataset.h:351

theoretica::harmonic_mean
real harmonic_mean(const Dataset &data)
Compute the harmonic mean of a set of values.
Definition dataset.h:389

theoretica::sum_compensated
real sum_compensated(const Vector &X)
Compute the sum of a set of values using the compensated Neumaier-Kahan-Babushka summation algorithm ...
Definition dataset.h:148

theoretica::sqrt
dual2 sqrt(dual2 x)
Compute the square root of a second order dual number.
Definition dual2_functions.h:54

theoretica::concatenate
Vector3 concatenate(const Vector1 &v1, const Vector2 &v2)
Concatenate two datasets to form a single one.
Definition dataset.h:312

theoretica::map
Vector2 & map(Function f, const Vector1 &src, Vector2 &dest)
Get a new vector obtained by applying the function element-wise.
Definition dataset.h:266

theoretica::abs
dual2 abs(dual2 x)
Compute the absolute value of a second order dual number.
Definition dual2_functions.h:198

theoretica::sum_pairwise
real sum_pairwise(const Vector &X, size_t begin=0, size_t end=0, size_t base_size=128)
Compute the sum of a set of values using pairwise summation to reduce round-off error.
Definition dataset.h:182

theoretica::sum
auto sum(const Vector &X)
Compute the sum of a vector of real values using pairwise summation to reduce round-off error.
Definition dataset.h:219

theoretica::geometric_mean
real geometric_mean(const Dataset &data)
Compute the geometric mean of a set of values as $\sqrt[n]{\prod_{i=1}^{n} x_i}$.
Definition dataset.h:415

theoretica::max
auto max(const Vector &X)
Finds the maximum value inside a dataset.
Definition dataset.h:330

theoretica::product_sum
auto product_sum(const Vector &X, const Vector &Y)
Sum the products of two sets of values.
Definition dataset.h:46

theoretica::product_sum_squares
auto product_sum_squares(const Vector &X, const Vector &Y)
Sum the products of the squares of two sets of data.
Definition dataset.h:63

theoretica::nan
TH_CONSTEXPR real nan()
Return a quiet NaN number in floating point representation.
Definition error.h:54

theoretica::quadratic_mean
real quadratic_mean(const Dataset &data)
Compute the quadratic mean (Root Mean Square) of a set of values, $\sqrt{\frac{1}{n} \sum_{i=1}^{n} x_i^2}$.
Definition dataset.h:433

theoretica::quotient_sum
auto quotient_sum(const Vector &X, const Vector &Y)
Sum the quotients of two sets of values.
Definition dataset.h:98

theoretica::MACH_EPSILON
constexpr real MACH_EPSILON
Machine epsilon for the real type.
Definition constants.h:207

theoretica::apply
Vector & apply(Function f, Vector &X)
Apply a function to a set of values element-wise.
Definition dataset.h:250

theoretica::root
real root(real x, int n)
Compute the n-th root of x.
Definition real_analysis.h:812

theoretica::product
auto product(const Vector &X)
Compute the product of a set of values.
Definition dataset.h:29

theoretica::sum_squares
auto sum_squares(const Vector &X)
Sum the squares of a set of values.
Definition dataset.h:127