From eda5bc26f44ee9a6f83dcf8c91f17296d7fc509d Mon Sep 17 00:00:00 2001 From: Nao Pross Date: Mon, 12 Feb 2024 14:52:43 +0100 Subject: Move into version control --- .../include/armadillo_bits/spglue_minus_meat.hpp | 340 +++++++++++++++++++++ 1 file changed, 340 insertions(+) create mode 100644 src/armadillo/include/armadillo_bits/spglue_minus_meat.hpp (limited to 'src/armadillo/include/armadillo_bits/spglue_minus_meat.hpp') diff --git a/src/armadillo/include/armadillo_bits/spglue_minus_meat.hpp b/src/armadillo/include/armadillo_bits/spglue_minus_meat.hpp new file mode 100644 index 0000000..1ad7161 --- /dev/null +++ b/src/armadillo/include/armadillo_bits/spglue_minus_meat.hpp @@ -0,0 +1,340 @@ +// SPDX-License-Identifier: Apache-2.0 +// +// Copyright 2008-2016 Conrad Sanderson (http://conradsanderson.id.au) +// Copyright 2008-2016 National ICT Australia (NICTA) +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. +// ------------------------------------------------------------------------ + + +//! \addtogroup spglue_minus +//! @{ + + + +template +inline +void +spglue_minus::apply(SpMat& out, const SpGlue& X) + { + arma_extra_debug_sigprint(); + + typedef typename T1::elem_type eT; + + const SpProxy pa(X.A); + const SpProxy pb(X.B); + + const bool is_alias = pa.is_alias(out) || pb.is_alias(out); + + if(is_alias == false) + { + spglue_minus::apply_noalias(out, pa, pb); + } + else + { + SpMat tmp; + + spglue_minus::apply_noalias(tmp, pa, pb); + + out.steal_mem(tmp); + } + } + + + +template +inline +void +spglue_minus::apply_noalias(SpMat& out, const SpProxy& pa, const SpProxy& pb) + { + arma_extra_debug_sigprint(); + + arma_debug_assert_same_size(pa.get_n_rows(), pa.get_n_cols(), pb.get_n_rows(), pb.get_n_cols(), "subtraction"); + + if(pa.get_n_nonzero() == 0) { out = pb.Q; out *= eT(-1); return; } + if(pb.get_n_nonzero() == 0) { out = pa.Q; return; } + + const uword max_n_nonzero = pa.get_n_nonzero() + pb.get_n_nonzero(); + + // Resize memory to upper bound + out.reserve(pa.get_n_rows(), pa.get_n_cols(), max_n_nonzero); + + // Now iterate across both matrices. + typename SpProxy::const_iterator_type x_it = pa.begin(); + typename SpProxy::const_iterator_type x_end = pa.end(); + + typename SpProxy::const_iterator_type y_it = pb.begin(); + typename SpProxy::const_iterator_type y_end = pb.end(); + + uword count = 0; + + while( (x_it != x_end) || (y_it != y_end) ) + { + eT out_val; + + const uword x_it_row = x_it.row(); + const uword x_it_col = x_it.col(); + + const uword y_it_row = y_it.row(); + const uword y_it_col = y_it.col(); + + bool use_y_loc = false; + + if(x_it == y_it) + { + out_val = (*x_it) - (*y_it); + + ++x_it; + ++y_it; + } + else + { + if((x_it_col < y_it_col) || ((x_it_col == y_it_col) && (x_it_row < y_it_row))) // if y is closer to the end + { + out_val = (*x_it); + + ++x_it; + } + else + { + out_val = -(*y_it); // take the negative + + ++y_it; + + use_y_loc = true; + } + } + + if(out_val != eT(0)) + { + access::rw(out.values[count]) = out_val; + + const uword out_row = (use_y_loc == false) ? x_it_row : y_it_row; + const uword out_col = (use_y_loc == false) ? x_it_col : y_it_col; + + access::rw(out.row_indices[count]) = out_row; + access::rw(out.col_ptrs[out_col + 1])++; + ++count; + } + + arma_check( (count > max_n_nonzero), "internal error: spglue_minus::apply_noalias(): count > max_n_nonzero" ); + } + + const uword out_n_cols = out.n_cols; + + uword* col_ptrs = access::rwp(out.col_ptrs); + + // Fix column pointers to be cumulative. + for(uword c = 1; c <= out_n_cols; ++c) + { + col_ptrs[c] += col_ptrs[c - 1]; + } + + if(count < max_n_nonzero) + { + if(count <= (max_n_nonzero/2)) + { + out.mem_resize(count); + } + else + { + // quick resize without reallocating memory and copying data + access::rw( out.n_nonzero) = count; + access::rw( out.values[count]) = eT(0); + access::rw(out.row_indices[count]) = uword(0); + } + } + } + + + +template +inline +void +spglue_minus::apply_noalias(SpMat& out, const SpMat& A, const SpMat& B) + { + arma_extra_debug_sigprint(); + + const SpProxy< SpMat > pa(A); + const SpProxy< SpMat > pb(B); + + spglue_minus::apply_noalias(out, pa, pb); + } + + + +// + + + +template +inline +void +spglue_minus_mixed::apply(SpMat::eT>& out, const mtSpGlue::eT, T1, T2, spglue_minus_mixed>& expr) + { + arma_extra_debug_sigprint(); + + typedef typename T1::elem_type eT1; + typedef typename T2::elem_type eT2; + + typedef typename promote_type::result out_eT; + + promote_type::check(); + + if( (is_same_type::no) && (is_same_type::yes) ) + { + // upgrade T1 + + const unwrap_spmat UA(expr.A); + const unwrap_spmat UB(expr.B); + + const SpMat& A = UA.M; + const SpMat& B = UB.M; + + SpMat AA(arma_layout_indicator(), A); + + for(uword i=0; i < A.n_nonzero; ++i) { access::rw(AA.values[i]) = out_eT(A.values[i]); } + + const SpMat& BB = reinterpret_cast< const SpMat& >(B); + + out = AA - BB; + } + else + if( (is_same_type::yes) && (is_same_type::no) ) + { + // upgrade T2 + + const unwrap_spmat UA(expr.A); + const unwrap_spmat UB(expr.B); + + const SpMat& A = UA.M; + const SpMat& B = UB.M; + + const SpMat& AA = reinterpret_cast< const SpMat& >(A); + + SpMat BB(arma_layout_indicator(), B); + + for(uword i=0; i < B.n_nonzero; ++i) { access::rw(BB.values[i]) = out_eT(B.values[i]); } + + out = AA - BB; + } + else + { + // upgrade T1 and T2 + + const unwrap_spmat UA(expr.A); + const unwrap_spmat UB(expr.B); + + const SpMat& A = UA.M; + const SpMat& B = UB.M; + + SpMat AA(arma_layout_indicator(), A); + SpMat BB(arma_layout_indicator(), B); + + for(uword i=0; i < A.n_nonzero; ++i) { access::rw(AA.values[i]) = out_eT(A.values[i]); } + for(uword i=0; i < B.n_nonzero; ++i) { access::rw(BB.values[i]) = out_eT(B.values[i]); } + + out = AA - BB; + } + } + + + +template +inline +void +spglue_minus_mixed::sparse_minus_dense(Mat< typename promote_type::result>& out, const T1& X, const T2& Y) + { + arma_extra_debug_sigprint(); + + typedef typename T1::elem_type eT1; + typedef typename T2::elem_type eT2; + + typedef typename promote_type::result out_eT; + + promote_type::check(); + + const quasi_unwrap UB(Y); + const Mat& B = UB.M; + + const uword B_n_elem = B.n_elem; + const eT2* B_mem = B.memptr(); + + out.set_size(B.n_rows, B.n_cols); + + out_eT* out_mem = out.memptr(); + + for(uword i=0; i pa(X); + + arma_debug_assert_same_size( pa.get_n_rows(), pa.get_n_cols(), out.n_rows, out.n_cols, "subtraction" ); + + typename SpProxy::const_iterator_type it = pa.begin(); + typename SpProxy::const_iterator_type it_end = pa.end(); + + while(it != it_end) + { + out.at(it.row(), it.col()) += out_eT(*it); + ++it; + } + } + + + +template +inline +void +spglue_minus_mixed::dense_minus_sparse(Mat< typename promote_type::result>& out, const T1& X, const T2& Y) + { + arma_extra_debug_sigprint(); + + typedef typename T1::elem_type eT1; + typedef typename T2::elem_type eT2; + + typedef typename promote_type::result out_eT; + + promote_type::check(); + + if(is_same_type::no) + { + out = conv_to< Mat >::from(X); + } + else + { + const quasi_unwrap UA(X); + + const Mat& A = UA.M; + + out = reinterpret_cast< const Mat& >(A); + } + + const SpProxy pb(Y); + + arma_debug_assert_same_size( out.n_rows, out.n_cols, pb.get_n_rows(), pb.get_n_cols(), "subtraction" ); + + typename SpProxy::const_iterator_type it = pb.begin(); + typename SpProxy::const_iterator_type it_end = pb.end(); + + while(it != it_end) + { + out.at(it.row(), it.col()) -= out_eT(*it); + ++it; + } + } + + + +//! @} -- cgit v1.2.1