tatami
C++ API for different matrix representations
Loading...
Searching...
No Matches
convert_to_compressed_sparse.hpp
Go to the documentation of this file.
1#ifndef TATAMI_CONVERT_TO_COMPRESSED_SPARSE_H
2#define TATAMI_CONVERT_TO_COMPRESSED_SPARSE_H
3
#include <memory>
#include <vector>
#include <cstddef>
#include <optional>
#include <algorithm>

#include "../utils/copy.hpp"

22namespace tatami {
23
27namespace convert_to_compressed_sparse_internal {
28
29template<typename Value_, typename Index_, typename Count_>
30void count_compressed_sparse_non_zeros_consistent(
32 const Index_ primary,
33 const Index_ secondary,
34 const bool row,
35 Count_* const output,
36 const int threads)
37{
38 if (matrix.is_sparse()) {
39 Options opt;
40 opt.sparse_extract_value = false;
41 opt.sparse_extract_index = false;
42 opt.sparse_ordered_index = false;
43
44 parallelize([&](const int, const Index_ start, const Index_ length) -> void {
45 auto wrk = consecutive_extractor<true>(matrix, row, start, length, opt);
46 for (Index_ x = 0; x < length; ++x) {
47 const auto range = wrk->fetch(NULL, NULL);
48 output[start + x] = range.number;
49 }
50 }, primary, threads);
51
52 } else {
53 parallelize([&](const int, const Index_ start, const Index_ length) -> void {
54 auto buffer_v = create_container_of_Index_size<std::vector<Value_> >(secondary);
55 auto wrk = consecutive_extractor<false>(matrix, row, start, length);
56 for (Index_ p = start, pe = start + length; p < pe; ++p) {
57 const auto ptr = wrk->fetch(buffer_v.data());
58 Count_ count = 0;
59 for (Index_ s = 0; s < secondary; ++s) {
60 count += (ptr[s] != 0);
61 }
62 output[p] = count;
63 }
64 }, primary, threads);
65 }
66}
67
68template<typename Value_, typename Index_, typename Count_>
69void count_compressed_sparse_non_zeros_inconsistent(
71 const Index_ primary,
72 const Index_ secondary,
73 const bool row,
74 Count_* const output,
75 const int threads
76) {
77 // To minimize false sharing, we allocate each buffer as a per-thread vector before moving it into the nz_counts for serial use.
78 // We skip the allocation for the first thread as this is allowed to use the (presumably zeroed) output array directly.
79 // Needless to say, the number of threads had better be positive.
80 auto nz_counts = sanisizer::create<std::vector<std::optional<std::vector<Count_> > > >(threads - 1);
81 const auto get_ptr = [&](const int t, std::optional<std::vector<Count_> >& nz_tmp) -> Count_* {
82 if (t) {
83 nz_tmp.emplace(cast_Index_to_container_size<std::vector<Count_> >(primary));
84 return nz_tmp->data();
85 } else {
86 return output;
87 }
88 };
89 const auto save_output = [&](const int t, std::optional<std::vector<Count_> >& nz_tmp) {
90 if (t) {
91 nz_counts[t - 1] = std::move(nz_tmp);
92 }
93 };
94 int num_used;
95
96 if (matrix.is_sparse()) {
97 Options opt;
98 opt.sparse_extract_value = false;
99 opt.sparse_ordered_index = false;
100
101 num_used = parallelize([&](const int t, const Index_ start, const Index_ length) -> void {
102 std::optional<std::vector<Count_> > nz_tmp;
103 Count_* cur_counts = get_ptr(t, nz_tmp);
104
105 auto wrk = consecutive_extractor<true>(matrix, !row, start, length, opt);
106 auto buffer_i = create_container_of_Index_size<std::vector<Index_> >(primary);
107 for (Index_ x = 0; x < length; ++x) {
108 const auto range = wrk->fetch(NULL, buffer_i.data());
109 for (Index_ i = 0; i < range.number; ++i) {
110 ++cur_counts[range.index[i]];
111 }
112 }
113
114 save_output(t, nz_tmp);
115 }, secondary, threads);
116
117 } else {
118 num_used = parallelize([&](const int t, const Index_ start, const Index_ length) -> void {
119 std::optional<std::vector<Count_> > nz_tmp;
120 Count_* cur_counts = get_ptr(t, nz_tmp);
121
122 auto wrk = consecutive_extractor<false>(matrix, !row, start, length);
123 auto buffer_v = create_container_of_Index_size<std::vector<Value_> >(primary);
124 for (Index_ x = 0; x < length; ++x) {
125 const auto ptr = wrk->fetch(buffer_v.data());
126 for (Index_ p = 0; p < primary; ++p) {
127 cur_counts[p] += (ptr[p] != 0);
128 }
129 }
130
131 save_output(t, nz_tmp);
132 }, secondary, threads);
133 }
134
135 for (int t = 1; t < num_used; ++t) {
136 const auto& y = *(nz_counts[t - 1]);
137 for (Index_ p = 0; p < primary; ++p) {
138 output[p] += y[p];
139 }
140 }
141}
142
143template<typename InputValue_, typename InputIndex_, typename Pointer_, typename StoredValue_, typename StoredIndex_>
144void fill_compressed_sparse_matrix_consistent(
146 const InputIndex_ primary,
147 const InputIndex_ secondary,
148 const bool row,
149 const Pointer_* const pointers,
150 StoredValue_* const output_value,
151 StoredIndex_* const output_index,
152 const int threads)
153{
154 if (matrix.is_sparse()) {
155 Options opt;
156 opt.sparse_ordered_index = false;
157
158 parallelize([&](const int, const InputIndex_ start, const InputIndex_ length) -> void {
159 auto wrk = consecutive_extractor<true>(matrix, row, start, length, opt);
160 auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(secondary);
161 auto buffer_i = create_container_of_Index_size<std::vector<InputIndex_> >(secondary);
162
163 for (InputIndex_ p = start, pe = start + length; p < pe; ++p) {
164 // Resist the urge to `fetch()` straight into 'output_v'
165 // and 'output_i', as implementations may assume that they
166 // have the entire 'length' length to play with, and the
167 // output vectors only have whatever is allocated from the
168 // first pass (which might be nothing for an all-zero matrix).
169 const auto range = wrk->fetch(buffer_v.data(), buffer_i.data());
170 const auto offset = pointers[p];
171 std::copy_n(range.value, range.number, output_value + offset);
172 std::copy_n(range.index, range.number, output_index + offset);
173 }
174 }, primary, threads);
175
176 } else {
177 parallelize([&](const int, const InputIndex_ start, const InputIndex_ length) -> void {
178 auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(secondary);
179 auto wrk = consecutive_extractor<false>(matrix, row, start, length);
180
181 for (InputIndex_ p = start, pe = start + length; p < pe; ++p) {
182 const auto ptr = wrk->fetch(buffer_v.data());
183 auto offset = pointers[p];
184 for (InputIndex_ s = 0; s < secondary; ++s) {
185 const auto val = ptr[s];
186 if (val != 0) {
187 output_value[offset] = val;
188 output_index[offset] = s;
189 ++offset;
190 }
191 }
192 }
193 }, primary, threads);
194 }
195}
196
197template<typename InputValue_, typename InputIndex_, typename Pointer_, typename StoredValue_, typename StoredIndex_>
198void fill_compressed_sparse_matrix_inconsistent(
200 const InputIndex_ primary,
201 const InputIndex_ secondary,
202 const bool row,
203 const Pointer_* const pointers,
204 StoredValue_* const output_value,
205 StoredIndex_* const output_index,
206 const int threads)
207{
208 if (matrix.is_sparse()) {
209 Options opt;
210 opt.sparse_ordered_index = false;
211
212 parallelize([&](const int, const InputIndex_ start, const InputIndex_ length) -> void {
213 auto wrk = consecutive_extractor<true>(matrix, !row, static_cast<InputIndex_>(0), secondary, start, length, opt);
214 auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(length);
215 auto buffer_i = create_container_of_Index_size<std::vector<InputIndex_> >(length);
216 std::vector<Pointer_> offset_copy(pointers + start, pointers + start + length);
217
218 for (InputIndex_ x = 0; x < secondary; ++x) {
219 const auto range = wrk->fetch(buffer_v.data(), buffer_i.data());
220 for (InputIndex_ i = 0; i < range.number; ++i) {
221 auto& pos = offset_copy[range.index[i] - start];
222 output_value[pos] = range.value[i];
223 output_index[pos] = x;
224 ++pos;
225 }
226 }
227 }, primary, threads);
228
229 } else {
230 parallelize([&](const int, const InputIndex_ start, const InputIndex_ length) -> void {
231 auto wrk = consecutive_extractor<false>(matrix, !row, static_cast<InputIndex_>(0), secondary, start, length);
232 auto buffer_v = create_container_of_Index_size<std::vector<InputValue_> >(length);
233 std::vector<Pointer_> offset_copy(pointers + start, pointers + start + length);
234
235 for (InputIndex_ x = 0; x < secondary; ++x) {
236 const auto ptr = wrk->fetch(buffer_v.data());
237 for (InputIndex_ p = 0; p < length; ++p) {
238 const auto val = ptr[p];
239 if (val != 0) {
240 auto& pos = offset_copy[p];
241 output_value[pos] = val;
242 output_index[pos] = x;
243 ++pos;
244 }
245 }
246 }
247 }, primary, threads);
248 }
249}
250
251}
265
281template<typename Value_, typename Index_, typename Count_>
283 const tatami::Matrix<Value_, Index_>& matrix,
284 const bool row,
285 Count_* const output,
287) {
288 const Index_ NR = matrix.nrow();
289 const Index_ NC = matrix.ncol();
290 const Index_ primary = (row ? NR : NC);
291 const Index_ secondary = (row ? NC : NR);
292 std::fill_n(output, primary, 0);
293
294 if (row == matrix.prefer_rows()) {
295 convert_to_compressed_sparse_internal::count_compressed_sparse_non_zeros_consistent(matrix, primary, secondary, row, output, options.num_threads);
296 } else {
297 convert_to_compressed_sparse_internal::count_compressed_sparse_non_zeros_inconsistent(matrix, primary, secondary, row, output, options.num_threads);
298 }
299}
300
310
330template<typename InputValue_, typename InputIndex_, typename Pointer_, typename StoredValue_, typename StoredIndex_>
333 const bool row,
334 const Pointer_* const pointers,
335 StoredValue_* const output_value,
336 StoredIndex_* const output_index,
338) {
339 const InputIndex_ NR = matrix.nrow();
340 const InputIndex_ NC = matrix.ncol();
341 const InputIndex_ primary = (row ? NR : NC);
342 const InputIndex_ secondary = (row ? NC : NR);
343
344 if (row == matrix.prefer_rows()) {
345 convert_to_compressed_sparse_internal::fill_compressed_sparse_matrix_consistent(matrix, primary, secondary, row, pointers, output_value, output_index, options.num_threads);
346 } else {
347 convert_to_compressed_sparse_internal::fill_compressed_sparse_matrix_inconsistent(matrix, primary, secondary, row, pointers, output_value, output_index, options.num_threads);
348 }
349}
350
361template<typename Value_, typename Index_, typename Pointer_>
366 std::vector<Value_> value;
367
371 std::vector<Index_> index;
372
376 std::vector<Pointer_> pointers;
377};
378
394
412template<typename StoredValue_, typename StoredIndex_, typename StoredPointer_ = std::size_t, typename InputValue_, typename InputIndex_>
415 const bool row,
417{
418 // We use size_t as the default pointer type here, as our output consists of vectors
419 // with the default allocator, for which the size_type is unlikely to be bigger than size_t.
421 auto& output_v = output.value;
422 auto& output_i = output.index;
423 auto& output_p = output.pointers;
424
425 const InputIndex_ NR = matrix.nrow();
426 const InputIndex_ NC = matrix.ncol();
427 const InputIndex_ primary = (row ? NR : NC);
428 const InputIndex_ secondary = (row ? NC : NR);
429
430 output_p.resize(sanisizer::sum<I<decltype(output_p.size())> >(attest_for_Index(primary), 1));
431
432 if (!options.two_pass) {
433 // Doing a single fragmented run and then concatenating everything together.
435 matrix,
436 row,
437 [&]{
439 roptions.num_threads = options.num_threads;
440 return roptions;
441 }()
442 );
443 const auto& store_v = frag.value;
444 const auto& store_i = frag.index;
445
446 for (InputIndex_ p = 0; p < primary; ++p) {
447 output_p[p + 1] = output_p[p] + store_v[p].size();
448 }
449
450 output_v.reserve(output_p.back());
451 output_i.reserve(output_p.back());
452 for (InputIndex_ p = 0; p < primary; ++p) {
453 output_v.insert(output_v.end(), store_v[p].begin(), store_v[p].end());
454 output_i.insert(output_i.end(), store_i[p].begin(), store_i[p].end());
455 }
456
457 } else if (row == matrix.prefer_rows()) {
458 // First pass to figure out how many non-zeros there are.
459 convert_to_compressed_sparse_internal::count_compressed_sparse_non_zeros_consistent(matrix, primary, secondary, row, output_p.data() + 1, options.num_threads);
460 for (InputIndex_ i = 1; i <= primary; ++i) {
461 output_p[i] += output_p[i - 1];
462 }
463
464 // Second pass to actually fill our vectors.
465 output_v.resize(output_p.back());
466 output_i.resize(output_p.back());
467 convert_to_compressed_sparse_internal::fill_compressed_sparse_matrix_consistent(
468 matrix,
469 primary,
470 secondary,
471 row,
472 output_p.data(),
473 output_v.data(),
474 output_i.data(),
475 options.num_threads
476 );
477
478 } else {
479 // First pass to figure out how many non-zeros there are.
480 convert_to_compressed_sparse_internal::count_compressed_sparse_non_zeros_inconsistent(matrix, primary, secondary, row, output_p.data() + 1, options.num_threads);
481 for (InputIndex_ i = 1; i <= primary; ++i) {
482 output_p[i] += output_p[i - 1];
483 }
484
485 // Second pass to actually fill our vectors.
486 output_v.resize(output_p.back());
487 output_i.resize(output_p.back());
488 convert_to_compressed_sparse_internal::fill_compressed_sparse_matrix_inconsistent(
489 matrix,
490 primary,
491 secondary,
492 row,
493 output_p.data(),
494 output_v.data(),
495 output_i.data(),
496 options.num_threads
497 );
498 }
499
500 return output;
501}
502
511 bool two_pass = false;
512
516 int num_threads = 1;
517};
518
536template<
537 typename Value_,
538 typename Index_,
539 typename StoredValue_ = Value_,
540 typename StoredIndex_ = Index_,
541 typename StoredPointer_ = std::size_t,
542 typename InputValue_,
543 typename InputIndex_
544>
545std::shared_ptr<Matrix<Value_, Index_> > convert_to_compressed_sparse(
547 const bool row,
549) {
551 matrix,
552 row,
553 [&]{
555 ropt.two_pass = options.two_pass;
556 ropt.num_threads = options.num_threads;
557 return ropt;
558 }()
559 );
560 return std::shared_ptr<Matrix<Value_, Index_> >(
562 Value_,
563 Index_,
564 std::vector<StoredValue_>,
565 std::vector<StoredIndex_>,
566 std::vector<StoredPointer_>
567 >(
568 matrix.nrow(),
569 matrix.ncol(),
570 std::move(comp.value),
571 std::move(comp.index),
572 std::move(comp.pointers),
573 row,
574 []{
575 CompressedSparseMatrixOptions copt;
576 copt.check = false; // no need for checks, as we guarantee correctness.
577 return copt;
578 }()
579 )
580 );
581}
582
586// Backwards compatibility.
587template<typename Value_, typename Index_, typename Count_>
588void count_compressed_sparse_non_zeros(const tatami::Matrix<Value_, Index_>* matrix, bool row, Count_* output, int threads) {
590 *matrix,
591 row,
592 output,
593 [&]{
594 CountCompressedSparseNonZerosOptions copt;
595 copt.num_threads = threads;
596 return copt;
597 }()
598 );
599}
600
601template<typename InputValue_, typename InputIndex_, typename Pointer_, typename StoredValue_, typename StoredIndex_>
603 bool row,
604 const Pointer_* pointers,
605 StoredValue_* output_value,
606 StoredIndex_* output_index,
607 int threads)
608{
610 *matrix,
611 row,
612 pointers,
613 output_value,
614 output_index,
615 [&]{
616 FillCompressedSparseContentsOptions fopt;
617 fopt.num_threads = threads;
618 return fopt;
619 }()
620 );
621}
622
623template<typename StoredValue_, typename StoredIndex_, typename StoredPointer_ = std::size_t, typename InputValue_, typename InputIndex_>
624CompressedSparseContents<StoredValue_, StoredIndex_, StoredPointer_> retrieve_compressed_sparse_contents(const Matrix<InputValue_, InputIndex_>* matrix, bool row, bool two_pass, int threads = 1) {
626 *matrix,
627 row,
628 [&]{
629 RetrieveCompressedSparseContentsOptions opt;
630 opt.two_pass = two_pass;
631 opt.num_threads = threads;
632 return opt;
633 }()
634 );
635}
636
637template<typename Value_ = double, typename Index_ = int, typename StoredValue_ = Value_, typename StoredIndex_ = Index_, typename InputValue_, typename InputIndex_>
638std::shared_ptr<Matrix<Value_, Index_> > convert_to_compressed_sparse(const Matrix<InputValue_, InputIndex_>* matrix, bool row, bool two_pass = false, int threads = 1) {
640 *matrix,
641 row,
642 [&]{
643 ConvertToCompressedSparseOptions opt;
644 opt.two_pass = two_pass;
645 opt.num_threads = threads;
646 return opt;
647 }()
648 );
649}
650
651template <bool row_, typename Value_, typename Index_, typename InputValue_, typename InputIndex_>
652CompressedSparseContents<Value_, Index_, std::size_t> retrieve_compressed_sparse_contents(const Matrix<InputValue_, InputIndex_>* matrix, bool two_pass, int threads = 1) {
653 return retrieve_compressed_sparse_contents<Value_, Index_>(matrix, row_, two_pass, threads);
654}
655
656template <bool row_, typename Value_, typename Index_, typename StoredValue_ = Value_, typename StoredIndex_ = Index_, typename InputValue_, typename InputIndex_>
657std::shared_ptr<Matrix<Value_, Index_> > convert_to_compressed_sparse(const Matrix<InputValue_, InputIndex_>* matrix, bool two_pass = false, int threads = 1) {
659}
664}
665
666#endif
Compressed sparse matrix representation.
Convert index type to container size.
Compressed sparse matrix representation.
Definition CompressedSparseMatrix.hpp:580
Virtual class for a matrix.
Definition Matrix.hpp:59
virtual Index_ ncol() const =0
virtual Index_ nrow() const =0
virtual bool prefer_rows() const =0
virtual bool is_sparse() const =0
Templated construction of a new consecutive extractor.
Convert a matrix into a fragmented sparse format.
Copy data from one buffer to another.
Flexible representations for matrix data.
Definition Extractor.hpp:15
void count_compressed_sparse_non_zeros(const tatami::Matrix< Value_, Index_ > &matrix, const bool row, Count_ *const output, const CountCompressedSparseNonZerosOptions &options)
Definition convert_to_compressed_sparse.hpp:282
FragmentedSparseContents< StoredValue_, StoredIndex_ > retrieve_fragmented_sparse_contents(const Matrix< InputValue_, InputIndex_ > &matrix, const bool row, const RetrieveFragmentedSparseContentsOptions &options)
Definition convert_to_fragmented_sparse.hpp:82
CompressedSparseContents< StoredValue_, StoredIndex_, StoredPointer_ > retrieve_compressed_sparse_contents(const Matrix< InputValue_, InputIndex_ > &matrix, const bool row, const RetrieveCompressedSparseContentsOptions &options)
Definition convert_to_compressed_sparse.hpp:413
int parallelize(Function_ fun, const Index_ tasks, const int workers)
Definition parallelize.hpp:58
void fill_compressed_sparse_contents(const tatami::Matrix< InputValue_, InputIndex_ > &matrix, const bool row, const Pointer_ *const pointers, StoredValue_ *const output_value, StoredIndex_ *const output_index, const FillCompressedSparseContentsOptions &options)
Definition convert_to_compressed_sparse.hpp:331
std::shared_ptr< Matrix< Value_, Index_ > > convert_to_compressed_sparse(const Matrix< InputValue_, InputIndex_ > &matrix, const bool row, const ConvertToCompressedSparseOptions &options)
Definition convert_to_compressed_sparse.hpp:545
Parallelized iteration over a tatami::Matrix.
Compressed sparse contents.
Definition convert_to_compressed_sparse.hpp:362
std::vector< Index_ > index
Definition convert_to_compressed_sparse.hpp:371
std::vector< Value_ > value
Definition convert_to_compressed_sparse.hpp:366
std::vector< Pointer_ > pointers
Definition convert_to_compressed_sparse.hpp:376
Options for convert_to_compressed_sparse().
Definition convert_to_compressed_sparse.hpp:506
bool two_pass
Definition convert_to_compressed_sparse.hpp:511
int num_threads
Definition convert_to_compressed_sparse.hpp:516
Options for count_compressed_sparse_non_zeros().
Definition convert_to_compressed_sparse.hpp:259
int num_threads
Definition convert_to_compressed_sparse.hpp:263
Options for fill_compressed_sparse_contents().
Definition convert_to_compressed_sparse.hpp:304
int num_threads
Definition convert_to_compressed_sparse.hpp:308
Options for retrieve_compressed_sparse_contents().
Definition convert_to_compressed_sparse.hpp:382
int num_threads
Definition convert_to_compressed_sparse.hpp:392
bool two_pass
Definition convert_to_compressed_sparse.hpp:387
Options for retrieve_fragmented_sparse_contents().
Definition convert_to_fragmented_sparse.hpp:62
int num_threads
Definition convert_to_fragmented_sparse.hpp:66