eigen/Eigen/src/SparseLU/SparseLU_column_dfs.h

// This file is part of Eigen, a lightweight C++ template library
// for linear algebra.
//
// Copyright (C) 2012 Désiré Nuentsa-Wakam <desire.nuentsa_wakam@inria.fr>
//
// This Source Code Form is subject to the terms of the Mozilla
// Public License v. 2.0. If a copy of the MPL was not distributed
// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.

/*

 * NOTE: This file is the modified version of [s,d,c,z]column_dfs.c file in SuperLU

 * -- SuperLU routine (version 2.0) --
 * Univ. of California Berkeley, Xerox Palo Alto Research Center,
 * and Lawrence Berkeley National Lab.
 * November 15, 1997
 *
 * Copyright (c) 1994 by Xerox Corporation.  All rights reserved.
 *
 * THIS MATERIAL IS PROVIDED AS IS, WITH ABSOLUTELY NO WARRANTY
 * EXPRESSED OR IMPLIED.  ANY USE IS AT YOUR OWN RISK.
 *
 * Permission is hereby granted to use or copy this program for any
 * purpose, provided the above notices are retained on all copies.
 * Permission to modify the code and to distribute modified code is
 * granted, provided the above notices are retained, and a notice that
 * the code was modified is included with the above copyright notice.
 */
#ifndef SPARSELU_COLUMN_DFS_H
#define SPARSELU_COLUMN_DFS_H
/**
 * \brief Performs a symbolic factorization on column jcol and decide the supernode boundary
 *
 * A supernode representative is the last column of a supernode.
 * The nonzeros in U[*,j] are segments that end at supernodes representatives.
 * The routine returns a list of the supernodal representatives
 * in topological order of the dfs that generates them.
 * The location of the first nonzero in each supernodal segment
 * (supernodal entry location) is also returned.
 *
 * \param m number of rows in the matrix
 * \param jcol Current column
 * \param perm_r Row permutation
 * \param maxsuper  Maximum number of column allowed in a supernode
 * \param [in,out] nseg Number of segments in current U[*,j] - new segments appended
 * \param lsub_col defines the rhs vector to start the dfs
 * \param [in,out] segrep Segment representatives - new segments appended
 * \param repfnz  First nonzero location in each row
 * \param xprune
 * \param marker  marker[i] == jj, if i was visited during dfs of current column jj;
 * \param parent
 * \param xplore working array
 * \param glu global LU data
 * \return 0 success
 *         > 0 number of bytes allocated when run out of space
 *
 */
template<typename IndexVector, typename ScalarVector>
struct LU_column_dfs_traits
{
  typedef typename IndexVector::Scalar Index;
  typedef typename ScalarVector::Scalar Scalar;
  LU_column_dfs_traits(Index jcol, Index& jsuper, LU_GlobalLU_t<IndexVector, ScalarVector>& glu)
   : m_jcol(jcol), m_jsuper_ref(jsuper), m_glu(glu)
 {}
  bool update_segrep(Index /*krep*/, Index /*jj*/)
  {
    return true;
  }
  void mem_expand(IndexVector& lsub, int& nextl, int chmark)
  {
    if (nextl >= m_glu.nzlmax)
      SparseLUBase<Scalar,Index>::LUMemXpand(lsub, m_glu.nzlmax, nextl, LSUB, m_glu.num_expansions);
    if (chmark != (m_jcol-1)) m_jsuper_ref = IND_EMPTY;
  }
  enum { ExpandMem = true };

  int m_jcol;
  int& m_jsuper_ref;
  LU_GlobalLU_t<IndexVector, ScalarVector>& m_glu;
};

template <typename Scalar, typename Index>
int SparseLUBase<Scalar,Index>::LU_column_dfs(const int m, const int jcol, IndexVector& perm_r, int maxsuper, int& nseg,  BlockIndexVector lsub_col, IndexVector& segrep, BlockIndexVector repfnz, IndexVector& xprune, IndexVector& marker, IndexVector& parent, IndexVector& xplore, GlobalLU_t& glu)
{

  int jsuper = glu.supno(jcol);
  int nextl = glu.xlsub(jcol);
  VectorBlock<IndexVector> marker2(marker, 2*m, m);


  LU_column_dfs_traits<IndexVector, ScalarVector> traits(jcol, jsuper, glu);

  // For each nonzero in A(*,jcol) do dfs
  for (int k = 0; lsub_col[k] != IND_EMPTY; k++)
  {
    int krow = lsub_col(k);
    lsub_col(k) = IND_EMPTY;
    int kmark = marker2(krow);

    // krow was visited before, go to the next nonz;
    if (kmark == jcol) continue;

    LU_dfs_kernel(jcol, perm_r, nseg, glu.lsub, segrep, repfnz, xprune, marker2, parent,
                   xplore, glu, nextl, krow, traits);
  } // for each nonzero ...

  int fsupc, jptr, jm1ptr, ito, ifrom, istop;
  int nsuper = glu.supno(jcol);
  int jcolp1 = jcol + 1;
  int jcolm1 = jcol - 1;

  // check to see if j belongs in the same supernode as j-1
  if ( jcol == 0 )
  { // Do nothing for column 0
    nsuper = glu.supno(0) = 0 ;
  }
  else
  {
    fsupc = glu.xsup(nsuper);
    jptr = glu.xlsub(jcol); // Not yet compressed
    jm1ptr = glu.xlsub(jcolm1);

    // Use supernodes of type T2 : see SuperLU paper
    if ( (nextl-jptr != jptr-jm1ptr-1) ) jsuper = IND_EMPTY;

    // Make sure the number of columns in a supernode doesn't
    // exceed threshold
    if ( (jcol - fsupc) >= maxsuper) jsuper = IND_EMPTY;

    /* If jcol starts a new supernode, reclaim storage space in
     * glu.lsub from previous supernode. Note we only store
     * the subscript set of the first and last columns of
     * a supernode. (first for num values, last for pruning)
     */
    if (jsuper == IND_EMPTY)
    { // starts a new supernode
      if ( (fsupc < jcolm1-1) )
      { // >= 3 columns in nsuper
        ito = glu.xlsub(fsupc+1);
        glu.xlsub(jcolm1) = ito;
        istop = ito + jptr - jm1ptr;
        xprune(jcolm1) = istop; // intialize xprune(jcol-1)
        glu.xlsub(jcol) = istop;

        for (ifrom = jm1ptr; ifrom < nextl; ++ifrom, ++ito)
          glu.lsub(ito) = glu.lsub(ifrom);
        nextl = ito;  // = istop + length(jcol)
      }
      nsuper++;
      glu.supno(jcol) = nsuper;
    } // if a new supernode
  } // end else:  jcol > 0

  // Tidy up the pointers before exit
  glu.xsup(nsuper+1) = jcolp1;
  glu.supno(jcolp1) = nsuper;
  xprune(jcol) = nextl;  // Intialize upper bound for pruning
  glu.xlsub(jcolp1) = nextl;

  return 0;
}
#endif