tatami/convert__to__fragmented__sparse_8hpp_source.html

#ifndef TATAMI_CONVERT_TO_FRAGMENTED_SPARSE_H

#define TATAMI_CONVERT_TO_FRAGMENTED_SPARSE_H


#include "FragmentedSparseMatrix.hpp"

#include "../utils/parallelize.hpp"

#include "../utils/consecutive_extractor.hpp"

#include "../utils/Index_to_container.hpp"


#include <memory>

#include <vector>

#include <cstddef>


namespace tatami {


/**
 * @brief Fragmented sparse contents.
 *
 * Two parallel "vectors of vectors": entry `p` of `value` and entry `p` of `index`
 * together describe one element of the primary dimension.
 *
 * @tparam Value_ Type of the stored values.
 * @tparam Index_ Type of the stored indices.
 */
template<typename Value_, typename Index_>
struct FragmentedSparseContents {
    /**
     * @param n Extent of the primary dimension; it is converted with
     * `cast_Index_to_container_size()` and used to size both outer vectors.
     */
    FragmentedSparseContents(Index_ n) :
        value(cast_Index_to_container_size<decltype(value)>(n)),
        index(cast_Index_to_container_size<decltype(index)>(n))
    {}

    /**
     * Values retained for each element of the primary dimension.
     */
    std::vector<std::vector<Value_>> value;

    /**
     * Indices matching `value`, one inner vector per element of the primary dimension.
     */
    std::vector<std::vector<Index_>> index;
};


/**
 * @brief Options for `retrieve_fragmented_sparse_contents()`.
 */
struct RetrieveFragmentedSparseContentsOptions {
    /**
     * Thread count handed to `parallelize()`; defaults to 1.
     */
    int num_threads{1};
};


/**
 * Collect the non-zero entries of a matrix into one value vector and one index
 * vector per element of the chosen primary dimension.
 *
 * An entry is kept only if its value converts to `true`, so explicit zeros
 * reported by a sparse extractor are dropped.
 *
 * @tparam StoredValue_ Type of the values held in the output.
 * @tparam StoredIndex_ Type of the indices held in the output.
 * @tparam InputValue_ Value type of the input matrix.
 * @tparam InputIndex_ Index type of the input matrix.
 *
 * @param matrix Matrix to read from.
 * @param row Whether the primary dimension of the output is the rows
 * (`true`, one vector pair per row) or the columns (`false`).
 * @param options Further options; `num_threads` is passed to `parallelize()`.
 *
 * @return Contents holding, for every primary element, the retained values and
 * their positions along the other dimension.
 */
template<typename StoredValue_, typename StoredIndex_, typename InputValue_, typename InputIndex_>
FragmentedSparseContents<StoredValue_, StoredIndex_> retrieve_fragmented_sparse_contents(
    const Matrix<InputValue_, InputIndex_>& matrix,
    bool row,
    const RetrieveFragmentedSparseContentsOptions& options)
{
    InputIndex_ NR = matrix.nrow();
    InputIndex_ NC = matrix.ncol();
    InputIndex_ primary = (row ? NR : NC);
    InputIndex_ secondary = (row ? NC : NR);

    FragmentedSparseContents<StoredValue_, StoredIndex_> output(primary);
    auto& store_v = output.value;
    auto& store_i = output.index;

    if (row == matrix.prefer_rows()) {
        // The requested primary dimension is the matrix's preferred one: each
        // task walks its own range of primary elements and fills them in turn.
        if (matrix.is_sparse()) {
            parallelize([&](int, InputIndex_ start, InputIndex_ length) -> void {
                auto wrk = consecutive_extractor<true>(matrix, row, start, length);
                auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(secondary);
                auto buffer_i = create_container_of_Index_size<std::vector<InputIndex_> >(secondary);

                for (InputIndex_ p = start, pe = start + length; p < pe; ++p) {
                    auto range = wrk->fetch(buffer_v.data(), buffer_i.data());
                    auto& sv = store_v[p];
                    auto& si = store_i[p];

                    // Upper bound only: zero-valued entries are filtered out below.
                    sv.reserve(range.number);
                    si.reserve(range.number);

                    for (InputIndex_ i = 0; i < range.number; ++i, ++range.value, ++range.index) {
                        if (*range.value) {
                            sv.push_back(*range.value);
                            si.push_back(*range.index);
                        }
                    }
                }
            }, primary, options.num_threads);

        } else {
            parallelize([&](int, InputIndex_ start, InputIndex_ length) -> void {
                auto wrk = consecutive_extractor<false>(matrix, row, start, length);
                auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(secondary);

                // Special conversion from dense to save ourselves from having to make
                // indices that we aren't really interested in.
                for (InputIndex_ p = start, pe = start + length; p < pe; ++p) {
                    auto ptr = wrk->fetch(buffer_v.data());
                    auto& sv = store_v[p];
                    auto& si = store_i[p];

                    for (InputIndex_ s = 0; s < secondary; ++s, ++ptr) {
                        if (*ptr) {
                            sv.push_back(*ptr);
                            si.push_back(s);
                        }
                    }
                }
            }, primary, options.num_threads);
        }

    } else {
        // We iterate on the input matrix's preferred dimension, under the
        // assumption that it may be arbitrarily costly to extract in the
        // non-preferred dim; it is thus cheaper to do cache-unfriendly inserts
        // into the output buffers.
        //
        // The work is still split over the primary dimension: every task scans
        // all `secondary` elements but only asks for the block [start, start + length)
        // of each one, so different tasks never append to the same output vector.

        if (matrix.is_sparse()) {
            parallelize([&](int, InputIndex_ start, InputIndex_ length) -> void {
                auto wrk = consecutive_extractor<true>(matrix, !row, static_cast<InputIndex_>(0), secondary, start, length);

                // Each fetch is limited to a block of `length` positions, so it can
                // report at most `length` entries; sizing the scratch space by the
                // block instead of the full `primary` extent avoids allocating
                // `primary` elements in every worker.
                auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(length);
                auto buffer_i = create_container_of_Index_size<std::vector<InputIndex_> >(length);

                for (InputIndex_ x = 0; x < secondary; ++x) {
                    auto range = wrk->fetch(buffer_v.data(), buffer_i.data());
                    for (InputIndex_ i = 0; i < range.number; ++i, ++range.value, ++range.index) {
                        if (*range.value) {
                            // The reported index is the position along the primary dimension.
                            store_v[*range.index].push_back(*range.value);
                            store_i[*range.index].push_back(x);
                        }
                    }
                }
            }, primary, options.num_threads);

        } else {
            parallelize([&](int, InputIndex_ start, InputIndex_ length) -> void {
                auto wrk = consecutive_extractor<false>(matrix, !row, static_cast<InputIndex_>(0), secondary, start, length);
                auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(length);

                for (InputIndex_ x = 0; x < secondary; ++x) {
                    auto ptr = wrk->fetch(buffer_v.data());
                    // The fetched block lines up with primary positions start, start + 1, ...
                    for (InputIndex_ p = start, pe = start + length; p < pe; ++p, ++ptr) {
                        if (*ptr) {
                            store_v[p].push_back(*ptr);
                            store_i[p].push_back(x);
                        }
                    }
                }
            }, primary, options.num_threads);
        }
    }

    return output;
}


/**
 * @brief Options for `convert_to_fragmented_sparse()`.
 */
struct ConvertToFragmentedSparseOptions {
    /**
     * Thread count, copied into `RetrieveFragmentedSparseContentsOptions::num_threads`
     * by `convert_to_fragmented_sparse()`; defaults to 1.
     */
    int num_threads{1};
};


/**
 * Build a `FragmentedSparseMatrix` from the contents of another matrix.
 *
 * @tparam Value_ Value type of the returned matrix interface.
 * @tparam Index_ Index type of the returned matrix interface.
 * @tparam StoredValue_ Type of the values stored inside the new matrix.
 * @tparam StoredIndex_ Type of the indices stored inside the new matrix.
 * @tparam InputValue_ Value type of the input matrix.
 * @tparam InputIndex_ Index type of the input matrix.
 *
 * @param matrix Matrix to convert.
 * @param row Passed both to `retrieve_fragmented_sparse_contents()` and to the
 * `FragmentedSparseMatrix` constructor, i.e. whether the fragments are per row.
 * @param options Further options; only `num_threads` is used.
 *
 * @return Shared pointer to the newly created matrix, with the same dimensions as `matrix`.
 */
template<
    typename Value_,
    typename Index_,
    typename StoredValue_ = Value_,
    typename StoredIndex_ = Index_,
    typename InputValue_,
    typename InputIndex_
>
std::shared_ptr<Matrix<Value_, Index_> > convert_to_fragmented_sparse(
    const Matrix<InputValue_, InputIndex_>& matrix,
    bool row,
    const ConvertToFragmentedSparseOptions& options)
{
    // Step 1: pull the non-zero entries out of the input.
    RetrieveFragmentedSparseContentsOptions retrieve_opt;
    retrieve_opt.num_threads = options.num_threads;
    auto contents = retrieve_fragmented_sparse_contents<StoredValue_, StoredIndex_>(matrix, row, retrieve_opt);

    // Step 2: hand the vectors over to the matrix.
    FragmentedSparseMatrixOptions matrix_opt;
    matrix_opt.check = false; // no need for checks, as we guarantee correctness.

    using Output = FragmentedSparseMatrix<
        Value_,
        Index_,
        std::vector<std::vector<StoredValue_> >,
        std::vector<std::vector<StoredIndex_> >
    >;

    return std::shared_ptr<Matrix<Value_, Index_> >(
        new Output(
            matrix.nrow(),
            matrix.ncol(),
            std::move(contents.value),
            std::move(contents.index),
            row,
            matrix_opt
        )
    );
}


// Backwards compatibility.

/**
 * Pointer-based overload of `convert_to_fragmented_sparse()`, kept for backwards compatibility.
 *
 * @param matrix Pointer to the matrix to convert; it is dereferenced without a null check.
 * @param row Forwarded unchanged to the reference-based overload.
 * @param threads Stored as `ConvertToFragmentedSparseOptions::num_threads`.
 *
 * @return Whatever the reference-based overload returns for `*matrix`.
 */
template<typename Value_, typename Index_, typename StoredValue_ = Value_, typename StoredIndex_ = Index_, typename InputValue_, typename InputIndex_>
std::shared_ptr<Matrix<Value_, Index_> > convert_to_fragmented_sparse(const Matrix<InputValue_, InputIndex_>* matrix, bool row, int threads = 1) {
    ConvertToFragmentedSparseOptions conv_opt;
    conv_opt.num_threads = threads;
    return convert_to_fragmented_sparse<Value_, Index_, StoredValue_, StoredIndex_>(*matrix, row, conv_opt);
}


/**
 * Pointer-based overload of `retrieve_fragmented_sparse_contents()`.
 *
 * @param matrix Pointer to the matrix to read; it is dereferenced without a null check.
 * @param row Forwarded unchanged to the reference-based overload.
 * @param threads Stored as `RetrieveFragmentedSparseContentsOptions::num_threads`.
 *
 * @return Whatever the reference-based overload returns for `*matrix`.
 */
template<typename StoredValue_, typename StoredIndex_, typename InputValue_, typename InputIndex_>
FragmentedSparseContents<StoredValue_, StoredIndex_> retrieve_fragmented_sparse_contents(const Matrix<InputValue_, InputIndex_>* matrix, bool row, int threads = 1) {
    RetrieveFragmentedSparseContentsOptions retrieve_opt;
    retrieve_opt.num_threads = threads;
    return retrieve_fragmented_sparse_contents<StoredValue_, StoredIndex_>(*matrix, row, retrieve_opt);
}


/**
 * Variant of `retrieve_fragmented_sparse_contents()` that takes the row/column
 * choice as a template argument instead of a function argument.
 *
 * @tparam row_ Value passed on as the `row` argument.
 *
 * @param matrix Pointer to the matrix to read, forwarded as-is.
 * @param threads Number of threads, forwarded as-is.
 *
 * @return Result of the overload taking `(matrix, row, threads)`.
 */
template <bool row_, typename StoredValue_, typename StoredIndex_, typename InputValue_, typename InputIndex_>
FragmentedSparseContents<StoredValue_, StoredIndex_> retrieve_fragmented_sparse_contents(const Matrix<InputValue_, InputIndex_>* matrix, int threads = 1) {
    constexpr bool by_row = row_;
    return retrieve_fragmented_sparse_contents<StoredValue_, StoredIndex_>(matrix, by_row, threads);
}


/**
 * Variant of `convert_to_fragmented_sparse()` that takes the row/column choice
 * as a template argument instead of a function argument.
 *
 * @tparam row_ Value passed on as the `row` argument.
 *
 * @param matrix Pointer to the matrix to convert, forwarded as-is.
 * @param threads Number of threads, forwarded as-is.
 *
 * @return Result of the overload taking `(matrix, row, threads)`.
 */
template <bool row_, typename Value_, typename Index_, typename StoredValue_ = Value_, typename StoredIndex_ = Index_, typename InputValue_, typename InputIndex_>
std::shared_ptr<Matrix<Value_, Index_> > convert_to_fragmented_sparse(const Matrix<InputValue_, InputIndex_>* matrix, int threads = 1) {
    constexpr bool by_row = row_;
    return convert_to_fragmented_sparse<Value_, Index_, StoredValue_, StoredIndex_>(matrix, by_row, threads);
}

}


#endif

FragmentedSparseMatrix.hpp
Fragmented sparse matrix representation.

tatami::FragmentedSparseMatrix
Fragmented sparse matrix representation.
Definition FragmentedSparseMatrix.hpp:467

tatami::Matrix
Virtual class for a matrix.
Definition Matrix.hpp:59

tatami::Matrix::ncol
virtual Index_ ncol() const =0

tatami::Matrix::nrow
virtual Index_ nrow() const =0

tatami::Matrix::prefer_rows
virtual bool prefer_rows() const =0

tatami::Matrix::is_sparse
virtual bool is_sparse() const =0

consecutive_extractor.hpp
Templated construction of a new consecutive extractor.

tatami
Flexible representations for matrix data.
Definition Extractor.hpp:15

tatami::cast_Index_to_container_size
decltype(std::declval< Container_ >().size()) cast_Index_to_container_size(Index_ x)
Definition Index_to_container.hpp:54

tatami::parallelize
void parallelize(Function_ fun, Index_ tasks, int threads)
Definition parallelize.hpp:42

tatami::retrieve_fragmented_sparse_contents
FragmentedSparseContents< StoredValue_, StoredIndex_ > retrieve_fragmented_sparse_contents(const Matrix< InputValue_, InputIndex_ > &matrix, bool row, const RetrieveFragmentedSparseContentsOptions &options)
Definition convert_to_fragmented_sparse.hpp:81

tatami::create_container_of_Index_size
Container_ create_container_of_Index_size(Index_ x, Args_ &&... args)
Definition Index_to_container.hpp:70

tatami::convert_to_fragmented_sparse
std::shared_ptr< Matrix< Value_, Index_ > > convert_to_fragmented_sparse(const Matrix< InputValue_, InputIndex_ > &matrix, bool row, const ConvertToFragmentedSparseOptions &options)
Definition convert_to_fragmented_sparse.hpp:217

tatami::consecutive_extractor
auto consecutive_extractor(const Matrix< Value_, Index_ > &matrix, bool row, Index_ iter_start, Index_ iter_length, Args_ &&... args)
Definition consecutive_extractor.hpp:35

parallelize.hpp
Parallelized iteration over a tatami::Matrix.

tatami::ConvertToFragmentedSparseOptions
Options for convert_to_fragmented_sparse().
Definition convert_to_fragmented_sparse.hpp:187

tatami::ConvertToFragmentedSparseOptions::num_threads
int num_threads
Definition convert_to_fragmented_sparse.hpp:191

tatami::FragmentedSparseContents
Fragmented sparse contents.
Definition convert_to_fragmented_sparse.hpp:32

tatami::FragmentedSparseContents::value
std::vector< std::vector< Value_ > > value
Definition convert_to_fragmented_sparse.hpp:48

tatami::FragmentedSparseContents::index
std::vector< std::vector< Index_ > > index
Definition convert_to_fragmented_sparse.hpp:55

tatami::RetrieveFragmentedSparseContentsOptions
Options for retrieve_fragmented_sparse_contents().
Definition convert_to_fragmented_sparse.hpp:61

tatami::RetrieveFragmentedSparseContentsOptions::num_threads
int num_threads
Definition convert_to_fragmented_sparse.hpp:65