Yannick Estève / ONTRAC-Kaldi

Blame view

src/matrix/sparse-matrix.h 16.6 KB
  // matrix/sparse-matrix.h
  
  // Copyright  2015  Johns Hopkins University (author: Daniel Povey)
  //            2015  Guoguo Chen
  //            2017  Shiyin Kang
  
  
  // See ../../COPYING for clarification regarding multiple authors
  //
  // Licensed under the Apache License, Version 2.0 (the "License");
  // you may not use this file except in compliance with the License.
  // You may obtain a copy of the License at
  //
  //  http://www.apache.org/licenses/LICENSE-2.0
  //
  // THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
  // KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
  // WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
  // MERCHANTABLITY OR NON-INFRINGEMENT.
  // See the Apache 2 License for the specific language governing permissions and
  // limitations under the License.
  
  #ifndef KALDI_MATRIX_SPARSE_MATRIX_H_
  #define KALDI_MATRIX_SPARSE_MATRIX_H_ 1
  
  #include <utility>
  #include <vector>
  
  #include "matrix/matrix-common.h"
  #include "matrix/kaldi-matrix.h"
  #include "matrix/kaldi-vector.h"
  #include "matrix/compressed-matrix.h"
  
  namespace kaldi {
  
  
  /// \addtogroup matrix_group
  /// @{
  
  /// A vector stored sparsely as a dimension (dim_) plus a list of
  /// (index, value) pairs (pairs_); see the private members at the bottom of the
  /// class.  Apart from a few trivial inline accessors and constructors, the
  /// members are only declared in this class body.
  template <typename Real>
  class SparseVector {
   public:
    /// Returns the dimension of the vector being represented (dim_).  This is
    /// not the number of stored pairs; see NumElements() for that.
    MatrixIndexT Dim() const { return dim_; }
  
    // NOTE(review): presumably the sum of all stored values -- confirm against
    // the out-of-line definition.
    Real Sum() const;
  
    // NOTE(review): presumably copies the stored values (not their indexes)
    // into *vec, which would then need dimension NumElements() -- confirm.
    template <class OtherReal>
    void CopyElementsToVec(VectorBase<OtherReal> *vec) const;
  
    // *vec += alpha * *this.
    template <class OtherReal>
    void AddToVec(Real alpha,
                  VectorBase<OtherReal> *vec) const;
  
    /// Copies from a sparse vector whose element type may differ from Real.
    template <class OtherReal>
    void CopyFromSvec(const SparseVector<OtherReal> &other);
  
    /// Copy assignment.
    SparseVector<Real> &operator = (const SparseVector<Real> &other);
  
    /// Copy constructor; implemented in terms of the assignment operator.
    SparseVector(const SparseVector<Real> &other) { *this = other; }
  
    void Swap(SparseVector<Real> *other);
  
    // Returns the maximum value in this vector and outputs the index associated
    // with it.  This is not the index into the Data() pointer; it is the index
    // into the vector it represents, i.e. the .first value in the pair.
    // If this vector's Dim() is zero it is an error to call this function.
    // If all the stored elements are negative and the underlying vector has
    // indexes that are not listed among the stored elements, or if no elements
    // are stored, it will return the first un-listed index, whose value
    // (implicitly) is zero.
    Real Max(int32 *index) const;
  
    /// Returns the number of stored (index, value) pairs, i.e. pairs_.size().
    /// These are intended to be the nonzero elements of the vector.
    MatrixIndexT NumElements() const { return pairs_.size(); }
  
    /// get an indexed element (0 <= i < NumElements()).  The index 'i' is a
    /// position in the stored pair list, not an index into the represented
    /// vector; no range check is done here.
    const std::pair<MatrixIndexT, Real> &GetElement(MatrixIndexT i) const {
      return pairs_[i];
    }
  
    // returns pointer to element data, or NULL if empty (use with NumElements()).
    std::pair<MatrixIndexT, Real> *Data();
  
    // returns pointer to element data, or NULL if empty (use with NumElements());
    // const version
    const std::pair<MatrixIndexT, Real> *Data() const;
  
    /// Sets elements to zero with probability zero_prob, else normally
    /// distributed.  Useful in testing.
    void SetRandn(BaseFloat zero_prob);
  
    /// Default constructor: dimension zero and no stored elements.
    SparseVector(): dim_(0) { }
  
    /// Constructs a vector of dimension 'dim' with no stored elements; asserts
    /// that dim >= 0.
    explicit SparseVector(MatrixIndexT dim): dim_(dim) { KALDI_ASSERT(dim >= 0); }
  
    // constructor from pairs; does not assume input pairs are sorted and uniq
    SparseVector(MatrixIndexT dim,
                 const std::vector<std::pair<MatrixIndexT, Real> > &pairs);
  
    // constructor from a VectorBase that keeps only the nonzero elements of 'vec'.
    explicit SparseVector(const VectorBase<Real> &vec);
  
    /// Resizes to this dimension.  resize_type == kUndefined
    /// behaves the same as kSetZero.
    void Resize(MatrixIndexT dim, MatrixResizeType resize_type = kSetZero);
  
    /// Writes this object to the stream 'os'; 'binary' selects binary vs. text
    /// mode.
    void Write(std::ostream &os, bool binary) const;
  
    /// Reads this object from a stream.  Note that the input-stream parameter
    /// is named 'os' in this declaration even though it is a std::istream.
    void Read(std::istream &os, bool binary);
  
    /// Scale all elements of sparse vector.
    void Scale(Real alpha);
  
   private:
    // Dimension of the vector being represented (what Dim() returns).
    MatrixIndexT dim_;
    // pairs of (index, value), where 'index' is the position within the
    // represented vector.  Stored in sorted order with no duplicates.
    // For now we use std::vector, but we could change this.
    std::vector<std::pair<MatrixIndexT, Real> > pairs_;
  };
  
  
  // NOTE(review): presumably returns the inner product of the dense vector
  // 'vec' with the sparse vector 'svec' -- only the declaration is visible in
  // this header, so confirm against the definition.
  template <typename Real>
  Real VecSvec(const VectorBase<Real> &vec,
               const SparseVector<Real> &svec);
  
  
  
  /// A matrix stored sparsely as a std::vector of SparseVector rows (rows_);
  /// see the private member at the bottom of the class.  Apart from three
  /// trivial inline constructors, the members are only declared in this class
  /// body.
  template <typename Real>
  class SparseMatrix {
   public:
    MatrixIndexT NumRows() const;
  
    MatrixIndexT NumCols() const;
  
    // NOTE(review): presumably the total number of stored elements over all
    // rows -- confirm against the out-of-line definition.
    MatrixIndexT NumElements() const;
  
    Real Sum() const;
  
    Real FrobeniusNorm() const;
  
  
    /// This constructor creates a SparseMatrix that just contains the nonzero
    /// elements of 'mat'.
    explicit SparseMatrix(const MatrixBase<Real> &mat);
  
    /// Copy to matrix.  It must already have the correct size.
    template <class OtherReal>
    void CopyToMat(MatrixBase<OtherReal> *other,
                   MatrixTransposeType t = kNoTrans) const;
  
    /// Copies the values of all the elements in SparseMatrix into a VectorBase
    /// object.
    void CopyElementsToVec(VectorBase<Real> *other) const;
  
    /// Copies data from another sparse matrix, whose element type may differ
    /// from Real; 'trans' selects whether the source is transposed.
    template<class OtherReal>
    void CopyFromSmat(const SparseMatrix<OtherReal> &other,
                      MatrixTransposeType trans = kNoTrans);
  
    /// Does *other = *other + alpha * *this.  Note that 'alpha' is declared as
    /// BaseFloat rather than Real.
    void AddToMat(BaseFloat alpha, MatrixBase<Real> *other,
                  MatrixTransposeType t = kNoTrans) const;
  
    /// Copy assignment.
    SparseMatrix<Real> &operator = (const SparseMatrix<Real> &other);
  
    /// Copy constructor with an optional transpose; because 'trans' has a
    /// default value this also serves as the ordinary copy constructor.
    /// Implemented in terms of CopyFromSmat().
    SparseMatrix(const SparseMatrix<Real> &other, MatrixTransposeType trans =
                     kNoTrans) {
      this->CopyFromSmat(other, trans);
    }
  
    void Swap(SparseMatrix<Real> *other);
  
    // returns pointer to element data, or NULL if empty (use with NumElements()).
    // NOTE(review): the pointer is to SparseVector rows, so the matching count
    // is presumably NumRows() rather than NumElements() -- confirm.
    SparseVector<Real> *Data();
  
    // returns pointer to element data, or NULL if empty (use with NumElements());
    // const version
    const SparseVector<Real> *Data() const;
  
    // initializer from the type that elsewhere in Kaldi is referred to as type
    // Posterior. indexed first by row-index; the pairs are (column-index, value),
    // and the constructor does not require them to be sorted and uniq.
    // NOTE(review): 'dim' is presumably the number of columns -- confirm.
    SparseMatrix(
        int32 dim,
        const std::vector<std::vector<std::pair<MatrixIndexT, Real> > > &pairs);
  
    /// Sets up to a pseudo-randomly initialized matrix, with each element zero
    /// with probability zero_prob and else normally distributed- mostly for
    /// purposes of testing.
    void SetRandn(BaseFloat zero_prob);
  
    /// Writes this object to the stream 'os'; 'binary' selects binary vs. text
    /// mode.
    void Write(std::ostream &os, bool binary) const;
  
    /// Reads this object from a stream.  Note that the input-stream parameter
    /// is named 'os' in this declaration even though it is a std::istream.
    void Read(std::istream &os, bool binary);
  
    /// Returns a const reference to row 'r'.
    const SparseVector<Real> &Row(MatrixIndexT r) const;
  
    /// Sets row r to "vec"; makes sure it has the correct dimension.
    void SetRow(int32 r, const SparseVector<Real> &vec);
  
    /// Select a subset of the rows of a SparseMatrix.
    /// Sets *this to only the rows of 'smat_other' that are listed
    /// in 'row_indexes'.
    /// 'row_indexes' must satisfy 0 <= row_indexes[i] < smat_other.NumRows().
    void SelectRows(const std::vector<int32> &row_indexes,
                    const SparseMatrix<Real> &smat_other);
  
  
    /// Sets *this to all the rows of *inputs appended together; this
    /// function is destructive of the inputs.  Requires, obviously,
    /// that the inputs all have the same dimension (although some may be
    /// empty).
    void AppendSparseMatrixRows(std::vector<SparseMatrix<Real> > *inputs);
  
    /// Default constructor: no rows.
    SparseMatrix() { }
  
    /// Constructs by calling Resize(num_rows, num_cols) with the default
    /// resize_type (kSetZero).
    SparseMatrix(int32 num_rows, int32 num_cols) { Resize(num_rows, num_cols); }
  
    /// Constructor from an array of indexes.
    /// If trans == kNoTrans, construct a sparse matrix
    /// with num-rows == indexes.Dim() and num-cols = 'dim'.
    /// 'indexes' is expected to contain elements in the
    /// range [0, dim - 1].  Each row 'i' of *this after
    /// calling the constructor will contain  a single
    /// element at column-index indexes[i] with value 1.0.
    ///
    /// If trans == kTrans, the result will be the transpose
    /// of the sparse matrix described above.
    SparseMatrix(const std::vector<int32> &indexes, int32 dim,
                 MatrixTransposeType trans = kNoTrans);
  
    /// Constructor from an array of indexes and an array of
    /// weights; requires indexes.Dim() == weights.Dim().
    /// If trans == kNoTrans, construct a sparse matrix
    /// with num-rows == indexes.Dim() and num-cols = 'dim'.
    /// 'indexes' is expected to contain elements in the
    /// range [0, dim - 1].  Each row 'i' of *this after
    /// calling the constructor will contain a single
    /// element at column-index indexes[i] with value weights[i].
    /// If trans == kTrans, the result will be the transpose
    /// of the sparse matrix described above.
    SparseMatrix(const std::vector<int32> &indexes,
                 const VectorBase<Real> &weights, int32 dim,
                 MatrixTransposeType trans = kNoTrans);
  
    /// Resizes the matrix; analogous to Matrix::Resize().  resize_type ==
    /// kUndefined behaves the same as kSetZero.
    void Resize(MatrixIndexT rows, MatrixIndexT cols,
                MatrixResizeType resize_type = kSetZero);
  
    /// Scale all elements in sparse matrix.
    void Scale(Real alpha);
  
    // Use the Matrix::CopyFromSmat() function to copy from this to Matrix.  Also
    // see Matrix::AddSmat().  There is not very extensive functionality for
    // SparseMat just yet (e.g. no matrix multiply); we will add things as needed
    // and as it seems necessary.
   private:
    // vector of SparseVectors, one per row, all of the same dim (use an stl
    // vector for now; this could change).
    std::vector<SparseVector<Real> > rows_;
  };
  
  
  // NOTE(review): presumably returns the trace of the product of the dense
  // matrix A with the sparse matrix B, with 'trans' controlling whether B is
  // transposed -- only the declaration is visible in this header, so confirm
  // against the definition.
  template<typename Real>
  Real TraceMatSmat(const MatrixBase<Real> &A,
                    const SparseMatrix<Real> &B,
                    MatrixTransposeType trans = kNoTrans);
  
  
  /// Identifies which underlying representation a GeneralMatrix currently
  /// holds; this is the return type of GeneralMatrix::Type().
  enum GeneralMatrixType {
    kFullMatrix,        // stored as a Matrix<BaseFloat>
    kCompressedMatrix,  // stored as a CompressedMatrix
    kSparseMatrix       // stored as a SparseMatrix<BaseFloat>
  };
  
  /// This class is a wrapper that enables you to store a matrix
  /// in one of three forms: either as a Matrix<BaseFloat>, or a CompressedMatrix,
  /// or a SparseMatrix<BaseFloat>.  It handles the I/O for you, i.e. you read
  /// and write a single object type.  It is useful for neural-net training
  /// targets which might be sparse or not, and might be compressed or not.
  class GeneralMatrix {
   public:
    /// Returns the type of the matrix: kSparseMatrix, kCompressedMatrix or
    /// kFullMatrix.  If this matrix is empty, returns kFullMatrix.
    GeneralMatrixType Type() const;
  
    void Compress();  // If it was a full matrix, compresses, changing Type() to
                      // kCompressedMatrix; otherwise does nothing.
  
    void Uncompress();  // If it was a compressed matrix, uncompresses, changing
                        // Type() to kFullMatrix; otherwise does nothing.
  
    /// Writes the matrix to the stream 'os'; 'binary' selects binary vs. text
    /// mode.
    void Write(std::ostream &os, bool binary) const;
  
  
    /// Reads the matrix from the stream 'is'.
    /// Note: if you write a compressed matrix in text form, it will be read as
    /// a regular full matrix.
    void Read(std::istream &is, bool binary);
  
    /// Returns the contents as a SparseMatrix.  This will only work if
    /// Type() returns kSparseMatrix, or NumRows() == 0; otherwise it will crash.
    const SparseMatrix<BaseFloat> &GetSparseMatrix() const;
  
    /// Swaps the contents with the given SparseMatrix.  This will only work if
    /// Type() returns kSparseMatrix, or NumRows() == 0.
    void SwapSparseMatrix(SparseMatrix<BaseFloat> *smat);
  
    /// Returns the contents as a compressed matrix.  This will only work if
    /// Type() returns kCompressedMatrix, or NumRows() == 0; otherwise it will
    /// crash.
    const CompressedMatrix &GetCompressedMatrix() const;
  
    /// Swaps the contents with the given CompressedMatrix.  This will only work
    /// if Type() returns kCompressedMatrix, or NumRows() == 0.
    void SwapCompressedMatrix(CompressedMatrix *cmat);
  
    /// Returns the contents as a Matrix<BaseFloat>.  This will only work if
    /// Type() returns kFullMatrix, or NumRows() == 0; otherwise it will crash.
    const Matrix<BaseFloat>& GetFullMatrix() const;
  
    /// Outputs the contents as a matrix.  This will work regardless of
    /// Type().  Sizes its output, unlike CopyToMat().
    void GetMatrix(Matrix<BaseFloat> *mat) const;
  
    /// Swaps the contents with the given Matrix.  This will only work if
    /// Type() returns kFullMatrix, or NumRows() == 0.
    void SwapFullMatrix(Matrix<BaseFloat> *mat);
  
    /// Copies contents, regardless of type, to "mat", which must be correctly
    /// sized.  See also GetMatrix(), which will size its output for you.
    void CopyToMat(MatrixBase<BaseFloat> *mat,
                   MatrixTransposeType trans = kNoTrans) const;
  
    /// Copies contents, regardless of type, to "cu_mat", which must be
    /// correctly sized.  Implemented in ../cudamatrix/cu-sparse-matrix.cc
    void CopyToMat(CuMatrixBase<BaseFloat> *cu_mat,
                   MatrixTransposeType trans = kNoTrans) const;
  
    /// Adds alpha times *this to mat.
    void AddToMat(BaseFloat alpha, MatrixBase<BaseFloat> *mat,
                  MatrixTransposeType trans = kNoTrans) const;
  
    /// Adds alpha times *this to cu_mat.
    /// Implemented in ../cudamatrix/cu-sparse-matrix.cc
    void AddToMat(BaseFloat alpha, CuMatrixBase<BaseFloat> *cu_mat,
                  MatrixTransposeType trans = kNoTrans) const;
  
    /// Scale each element of matrix by alpha.
    void Scale(BaseFloat alpha);
  
    /// Assignment from regular matrix.
    GeneralMatrix &operator= (const MatrixBase<BaseFloat> &mat);
  
    /// Assignment from compressed matrix.
    GeneralMatrix &operator= (const CompressedMatrix &mat);
  
    /// Assignment from SparseMatrix<BaseFloat>
    GeneralMatrix &operator= (const SparseMatrix<BaseFloat> &smat);
  
    MatrixIndexT NumRows() const;
  
    MatrixIndexT NumCols() const;
  
    // The three explicit constructors below each delegate to the assignment
    // operator for the corresponding source type.
    explicit GeneralMatrix(const MatrixBase<BaseFloat> &mat) { *this = mat; }
  
    explicit GeneralMatrix(const CompressedMatrix &cmat) { *this = cmat; }
  
    explicit GeneralMatrix(const SparseMatrix<BaseFloat> &smat) { *this = smat; }
  
    // Default constructor; all three member matrices are default-constructed.
    GeneralMatrix() { }
    // Assignment operator.
    GeneralMatrix &operator =(const GeneralMatrix &other);
    // Copy constructor; implemented in terms of the assignment operator.
    GeneralMatrix(const GeneralMatrix &other) { *this = other; }
    // Sets to the empty matrix.
    void Clear();
    // shallow swap
    void Swap(GeneralMatrix *other);
   private:
    // We don't explicitly store the type of the matrix.  Rather, we make
    // sure that only one of the matrices is ever nonempty, and the Type()
    // returns that one, or kFullMatrix if all are empty.
    Matrix<BaseFloat> mat_;
    CompressedMatrix cmat_;
    SparseMatrix<BaseFloat> smat_;
  };
  
  
  /// Appends all the matrix rows of a list of GeneralMatrixes, to get a single
  /// GeneralMatrix.  Preserves sparsity if all inputs were sparse (or empty).
  /// Does not preserve compression, if inputs were compressed; you have to
  /// re-compress manually, if that's what you need.
  ///
  /// 'src' is the list of input matrices (passed as const pointers, so they are
  /// not modified); 'mat' is the output.
  void AppendGeneralMatrixRows(const std::vector<const GeneralMatrix *> &src,
                               GeneralMatrix *mat);
  
  
  /// Outputs a SparseMatrix<Real> containing only the rows r of "in" such that
  /// keep_rows[r] == true.  keep_rows.size() must equal in.NumRows(), and
  /// keep_rows must contain at least one "true" element.
  template <typename Real>
  void FilterSparseMatrixRows(const SparseMatrix<Real> &in,
                              const std::vector<bool> &keep_rows,
                              SparseMatrix<Real> *out);
  
  /// Outputs a Matrix<Real> containing only the rows r of "in" such that
  /// keep_rows[r] == true.  keep_rows.size() must equal in.NumRows(), and
  /// keep_rows must contain at least one "true" element.
  template <typename Real>
  void FilterMatrixRows(const Matrix<Real> &in,
                        const std::vector<bool> &keep_rows,
                        Matrix<Real> *out);
  
  /// Outputs a Matrix<BaseFloat> (i.e. an uncompressed matrix) containing only
  /// the rows r of the compressed matrix "in" such that keep_rows[r] == true.
  /// keep_rows.size() must equal in.NumRows(), and keep_rows must contain at
  /// least one "true" element.
  void FilterCompressedMatrixRows(const CompressedMatrix &in,
                                  const std::vector<bool> &keep_rows,
                                  Matrix<BaseFloat> *out);
  
  
  /// Outputs a GeneralMatrix containing only the rows r of "in" such that
  /// keep_rows[r] == true.  keep_rows.size() must equal in.NumRows(), and
  /// keep_rows must contain at least one "true" element.  If in.Type() is
  /// kCompressedMatrix, the result will not be compressed; otherwise, the type
  /// is preserved.
  ///
  /// 'in' is the input matrix, 'keep_rows' is the per-row selection mask, and
  /// 'out' receives the filtered result.
  void FilterGeneralMatrixRows(const GeneralMatrix &in,
                               const std::vector<bool> &keep_rows,
                               GeneralMatrix *out);
  
  /// This function extracts a row-range of a GeneralMatrix and writes
  /// as a GeneralMatrix containing the same type of underlying
  /// matrix.  If the row-range is partly outside the row-range of 'in'
  /// (i.e. if row_offset < 0 or row_offset + num_rows > in.NumRows())
  /// then it will pad with copies of the first and last row as
  /// needed.
  /// This is more efficient than un-compressing and
  /// re-compressing the underlying CompressedMatrix, and causes
  /// less accuracy loss due to re-compression (no loss in most cases).
  ///
  /// 'in' is the input matrix; 'row_offset' is the index in 'in' of the first
  /// requested row (may be negative, per the padding rule above); 'num_rows'
  /// is the number of rows requested; 'out' receives the result.
  void ExtractRowRangeWithPadding(
      const GeneralMatrix &in,
      int32 row_offset,
      int32 num_rows,
      GeneralMatrix *out);
  
  
  /// @} end of \addtogroup matrix_group
  
  
  }  // namespace kaldi
  
  #endif  // KALDI_MATRIX_SPARSE_MATRIX_H_