2020-12-02 23:56:22 +08:00
|
|
|
use crate::csr::CsrMatrix;
|
2020-12-21 22:09:29 +08:00
|
|
|
use crate::ops::{Op};
|
2020-12-14 23:55:06 +08:00
|
|
|
use crate::SparseEntryMut;
|
|
|
|
use crate::ops::serial::{OperationError, OperationErrorType};
|
2020-12-03 00:04:19 +08:00
|
|
|
use nalgebra::{Scalar, DMatrixSlice, ClosedAdd, ClosedMul, DMatrixSliceMut};
|
2020-12-02 23:56:22 +08:00
|
|
|
use num_traits::{Zero, One};
|
2020-12-10 20:30:37 +08:00
|
|
|
use std::sync::Arc;
|
2020-12-14 23:55:06 +08:00
|
|
|
use std::borrow::Cow;
|
2020-12-02 23:56:22 +08:00
|
|
|
|
2020-12-21 22:09:29 +08:00
|
|
|
/// Sparse-dense matrix-matrix multiplication `C <- beta * C + alpha * op(A) * op(B)`.
|
2020-12-21 22:42:32 +08:00
|
|
|
pub fn spmm_csr_dense<'a, T>(beta: T,
|
|
|
|
c: impl Into<DMatrixSliceMut<'a, T>>,
|
2020-12-02 23:56:22 +08:00
|
|
|
alpha: T,
|
2020-12-21 22:09:29 +08:00
|
|
|
a: Op<&CsrMatrix<T>>,
|
|
|
|
b: Op<impl Into<DMatrixSlice<'a, T>>>)
|
2020-12-02 23:56:22 +08:00
|
|
|
where
|
|
|
|
T: Scalar + ClosedAdd + ClosedMul + Zero + One
|
|
|
|
{
|
2020-12-21 22:09:29 +08:00
|
|
|
let b = b.convert();
|
2020-12-21 22:42:32 +08:00
|
|
|
spmm_csr_dense_(beta, c.into(), alpha, a, b)
|
2020-12-02 23:56:22 +08:00
|
|
|
}
|
|
|
|
|
2020-12-21 22:42:32 +08:00
|
|
|
/// Worker for `spmm_csr_dense`: computes `C <- beta * C + alpha * op(A) * op(B)`
/// where `A` is CSR and `B`, `C` are dense slices.
///
/// The two arms of the outer `match` use different accumulation strategies:
/// - `op(A) = A^T`: contributions are scattered into rows of `C` in sparse order,
///   so `C` must be pre-scaled by `beta` once up front.
/// - `op(A) = A`: each `c_ij` is computed as a full dot product, so `beta` and
///   `alpha` are applied in a single in-place update per entry.
fn spmm_csr_dense_<T>(beta: T,
                      mut c: DMatrixSliceMut<T>,
                      alpha: T,
                      a: Op<&CsrMatrix<T>>,
                      b: Op<DMatrixSlice<T>>)
where
    T: Scalar + ClosedAdd + ClosedMul + Zero + One
{
    assert_compatible_spmm_dims!(c, a, b);

    match a {
        Op::Transpose(ref a) => {
            // In this case, we have to pre-multiply C by beta
            c *= beta;

            // Iterate rows of A; entry a_ki of A contributes to row i of C
            // (since op(A) = A^T), scaled by alpha.
            for k in 0..a.nrows() {
                let a_row_k = a.row(k);
                for (&i, a_ki) in a_row_k.col_indices().iter().zip(a_row_k.values()) {
                    let gamma_ki = alpha.inlined_clone() * a_ki.inlined_clone();
                    let mut c_row_i = c.row_mut(i);
                    match b {
                        Op::NoOp(ref b) => {
                            // C[i, :] += gamma_ki * B[k, :]
                            let b_row_k = b.row(k);
                            for (c_ij, b_kj) in c_row_i.iter_mut().zip(b_row_k.iter()) {
                                *c_ij += gamma_ki.inlined_clone() * b_kj.inlined_clone();
                            }
                        },
                        Op::Transpose(ref b) => {
                            // op(B) = B^T: row k of op(B) is column k of B.
                            let b_col_k = b.column(k);
                            for (c_ij, b_jk) in c_row_i.iter_mut().zip(b_col_k.iter()) {
                                *c_ij += gamma_ki.inlined_clone() * b_jk.inlined_clone();
                            }
                        },
                    }
                }
            }
        },
        Op::NoOp(ref a) => {
            // Column-major traversal of C: for each column j, walk all rows i of A
            // and form the sparse dot product of A[i, :] with column j of op(B).
            for j in 0..c.ncols() {
                let mut c_col_j = c.column_mut(j);
                for (c_ij, a_row_i) in c_col_j.iter_mut().zip(a.row_iter()) {
                    let mut dot_ij = T::zero();
                    for (&k, a_ik) in a_row_i.col_indices().iter().zip(a_row_i.values()) {
                        // op(B)[k, j] is B[k, j] or B[j, k] depending on transposition.
                        let b_contrib =
                            match b {
                                Op::NoOp(ref b) => b.index((k, j)),
                                Op::Transpose(ref b) => b.index((j, k))
                            };
                        dot_ij += a_ik.inlined_clone() * b_contrib.inlined_clone();
                    }
                    // Apply beta and alpha in one pass; no pre-scaling needed here.
                    *c_ij = beta.inlined_clone() * c_ij.inlined_clone() + alpha.inlined_clone() * dot_ij;
                }
            }
        }
    }
}
|
|
|
|
|
|
|
|
fn spadd_csr_unexpected_entry() -> OperationError {
|
|
|
|
OperationError::from_type_and_message(
|
|
|
|
OperationErrorType::InvalidPattern,
|
|
|
|
String::from("Found entry in `a` that is not present in `c`."))
|
|
|
|
}
|
|
|
|
|
2020-12-21 22:09:29 +08:00
|
|
|
/// Sparse matrix addition `C <- beta * C + alpha * op(A)`.
///
/// If the pattern of `c` does not accommodate all the non-zero entries in `a`, an error is
/// returned.
pub fn spadd_csr<T>(beta: T,
                    c: &mut CsrMatrix<T>,
                    alpha: T,
                    a: Op<&CsrMatrix<T>>)
                    -> Result<(), OperationError>
where
    T: Scalar + ClosedAdd + ClosedMul + Zero + One
{
    assert_compatible_spadd_dims!(c, a);

    // TODO: Change CsrMatrix::pattern() to return `&Arc` instead of `Arc`
    if Arc::ptr_eq(&c.pattern(), &a.inner_ref().pattern()) {
        // Special fast path: The two matrices have *exactly* the same sparsity pattern,
        // so we only need to sum the value arrays
        for (c_ij, a_ij) in c.values_mut().iter_mut().zip(a.inner_ref().values()) {
            let (alpha, beta) = (alpha.inlined_clone(), beta.inlined_clone());
            *c_ij = beta * c_ij.inlined_clone() + alpha * a_ij.inlined_clone();
        }
        Ok(())
    } else {
        if let Op::Transpose(a) = a
        {
            // Transposed case: contributions are scattered via per-entry lookup
            // (`index_entry_mut`), so scale all of C by beta up front, once.
            if beta != T::one() {
                for c_ij in c.values_mut() {
                    *c_ij *= beta.inlined_clone();
                }
            }

            // Entry a[i, j] of A contributes to c[j, i].
            for (i, a_row_i) in a.row_iter().enumerate() {
                for (&j, a_val) in a_row_i.col_indices().iter().zip(a_row_i.values()) {
                    let a_val = a_val.inlined_clone();
                    let alpha = alpha.inlined_clone();
                    match c.index_entry_mut(j, i) {
                        SparseEntryMut::NonZero(c_ji) => { *c_ji += alpha * a_val }
                        // C's pattern has no slot for this entry: report the mismatch.
                        SparseEntryMut::Zero => return Err(spadd_csr_unexpected_entry()),
                    }
                }
            }
        } else if let Op::NoOp(a) = a {
            // Row-aligned case: walk corresponding rows of C and A together.
            for (mut c_row_i, a_row_i) in c.row_iter_mut().zip(a.row_iter()) {
                // Scale this row of C by beta before accumulating (skip the no-op case).
                if beta != T::one() {
                    for c_ij in c_row_i.values_mut() {
                        *c_ij *= beta.inlined_clone();
                    }
                }

                let (mut c_cols, mut c_vals) = c_row_i.cols_and_values_mut();
                let (a_cols, a_vals) = (a_row_i.col_indices(), a_row_i.values());

                for (a_col, a_val) in a_cols.iter().zip(a_vals) {
                    // TODO: Use exponential search instead of linear search.
                    // If C has substantially more entries in the row than A, then a line search
                    // will needlessly visit many entries in C.
                    let (c_idx, _) = c_cols.iter()
                        .enumerate()
                        .find(|(_, c_col)| *c_col == a_col)
                        .ok_or_else(spadd_csr_unexpected_entry)?;
                    c_vals[c_idx] += alpha.inlined_clone() * a_val.inlined_clone();
                    // Advance the C slices monotonically so later searches never re-scan
                    // earlier entries. NOTE(review): this assumes column indices within a
                    // row are sorted ascending — confirm against the CSR pattern invariants.
                    c_cols = &c_cols[c_idx ..];
                    c_vals = &mut c_vals[c_idx ..];
                }
            }
        }
        Ok(())
    }
}
|
|
|
|
|
2020-12-16 21:06:12 +08:00
|
|
|
fn spmm_csr_unexpected_entry() -> OperationError {
|
|
|
|
OperationError::from_type_and_message(
|
|
|
|
OperationErrorType::InvalidPattern,
|
|
|
|
String::from("Found unexpected entry that is not present in `c`."))
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Sparse-sparse matrix multiplication, `C <- beta * C + alpha * op(A) * op(B)`.
///
/// Returns an error if the product has a structural non-zero for which `c`'s
/// sparsity pattern has no slot.
pub fn spmm_csr<T>(
    beta: T,
    c: &mut CsrMatrix<T>,
    alpha: T,
    a: Op<&CsrMatrix<T>>,
    b: Op<&CsrMatrix<T>>)
    -> Result<(), OperationError>
where
    T: Scalar + ClosedAdd + ClosedMul + Zero + One
{
    assert_compatible_spmm_dims!(c, a, b);

    use Op::{NoOp, Transpose};

    match (&a, &b) {
        (NoOp(ref a), NoOp(ref b)) => {
            // Untransposed case: row i of C accumulates sum_k a_ik * B[k, :].
            for (mut c_row_i, a_row_i) in c.row_iter_mut().zip(a.row_iter()) {
                // Scale this row of C by beta before accumulating contributions.
                for c_ij in c_row_i.values_mut() {
                    *c_ij = beta.inlined_clone() * c_ij.inlined_clone();
                }

                for (&k, a_ik) in a_row_i.col_indices().iter().zip(a_row_i.values()) {
                    let b_row_k = b.row(k);
                    let (mut c_row_i_cols, mut c_row_i_values) = c_row_i.cols_and_values_mut();
                    let alpha_aik = alpha.inlined_clone() * a_ik.inlined_clone();
                    for (j, b_kj) in b_row_k.col_indices().iter().zip(b_row_k.values()) {
                        // Determine the location in C to append the value
                        let (c_local_idx, _) = c_row_i_cols.iter()
                            .enumerate()
                            .find(|(_, c_col)| *c_col == j)
                            .ok_or_else(spmm_csr_unexpected_entry)?;

                        c_row_i_values[c_local_idx] += alpha_aik.inlined_clone() * b_kj.inlined_clone();
                        // Advance the slices so the next (larger) column of B's row is
                        // searched from the current position onward. NOTE(review): relies
                        // on column indices in a row being sorted — confirm pattern invariant.
                        c_row_i_cols = &c_row_i_cols[c_local_idx ..];
                        c_row_i_values = &mut c_row_i_values[c_local_idx ..];
                    }
                }
            }
            Ok(())
        },
        _ => {
            // Currently we handle transposition by explicitly precomputing transposed matrices
            // and calling the operation again without transposition
            // TODO: At least use workspaces to allow control of allocations. Maybe
            // consider implementing certain patterns (like A^T * B) explicitly
            let a_ref: &CsrMatrix<T> = a.inner_ref();
            let b_ref: &CsrMatrix<T> = b.inner_ref();
            // Cow lets us avoid allocating for the operand(s) that are not transposed.
            let (a, b) = {
                use Cow::*;
                match (&a, &b) {
                    (NoOp(_), NoOp(_)) => unreachable!(),
                    (Transpose(ref a), NoOp(_)) => (Owned(a.transpose()), Borrowed(b_ref)),
                    (NoOp(_), Transpose(ref b)) => (Borrowed(a_ref), Owned(b.transpose())),
                    (Transpose(ref a), Transpose(ref b)) => (Owned(a.transpose()), Owned(b.transpose()))
                }
            };

            // Recurse exactly once: both operands are now NoOp, so the first arm handles it.
            spmm_csr(beta, c, alpha, NoOp(a.as_ref()), NoOp(b.as_ref()))
        }
    }
}
|
|
|
|
|