sym-ildl/html/lilc__matrix__ildl_8h_source.html

 #ifndef _LILC_MATRIX_ILDL_H_
 #define _LILC_MATRIX_ILDL_H_


 using std::endl;
 using std::cout;
 using std::abs;

 /*! \brief Computes an LDL' factorization of this matrix with dropping (incomplete factorization)
  *         and symmetric pivoting, writing the factors into L and D.
  *
  * The columns are processed left to right. For each column k the routine
  *   1. scatters column k of this matrix into the dense vector `work` and applies the delayed
  *      updates from the already factored columns through update(),
  *   2. selects a 1x1 or 2x2 pivot according to piv_type, interchanging rows/columns through
  *      pivot() and recording every interchange in perm,
  *   3. drops entries through drop_tol(), and
  *   4. stores the resulting column(s) in L and the pivot in D.
  * A 2x2 pivot consumes columns k and k+1 in a single iteration.
  *
  * Static pivoting: a 1x1 pivot whose magnitude is below eps is replaced by 1e-6; for a 2x2 pivot
  * a determinant whose magnitude is below eps is replaced by 1e-6 when forming the inverse of the
  * block (the entries stored in D are left as computed).
  *
  * NOTE(review): pivot() and advance_list() are invoked on this matrix, so *this is presumably
  * left in its permuted state after the call -- confirm against those helpers.
  *
  * \param L           output factor. Resized to ncols x ncols; column k receives a unit diagonal entry
  *                    followed by the retained off-diagonal entries. L.nnz_count is set on exit.
  * \param D           output block diagonal. D[k] holds the diagonal of each pivot; for a 2x2 pivot
  *                    D[k+1] and D.off_diagonal(k) are filled in as well.
  * \param perm        permutation record. Entries are only swapped here; the vector is neither resized
  *                    nor initialised, so it presumably has to arrive holding a valid permutation of
  *                    at least ncols entries (confirm with the caller).
  * \param fill_factor controls the fill limit lfil handed to drop_tol(): lfil = 2*fill_factor*nnz()/ncols,
  *                    or ncols when fill_factor exceeds 1e4.
  * \param tol         drop tolerance, forwarded unchanged to drop_tol().
  * \param pp_tol      threshold of the partial pivoting search in the BKP branch: the first entry whose
  *                    magnitude exceeds pp_tol*w1 (by more than eps) is taken as pivot candidate.
  * \param piv_type    pivot_type::BKP or pivot_type::ROOK. Any other value skips the pivot search, so
  *                    every column is used as a 1x1 pivot without interchanges.
  */
 template <class el_type>
 void lilc_matrix<el_type> :: ildl(lilc_matrix<el_type>& L, block_diag_matrix<el_type>& D, idx_vector_type& perm, const double& fill_factor, const double& tol, const double& pp_tol, int piv_type)
 {

     //----------------- initialize temporary variables --------------------//
     const int ncols = n_cols(); //number of cols in A.

     //lfil is handed to drop_tol() below as the fill limit (presumably the maximum number of
     //entries kept per column of L -- confirm against drop_tol).
     int lfil;
     if (fill_factor > 1e4) lfil = ncols; //just in case users decide to enter a giant fill factor for fun...
     else lfil = 2*fill_factor*nnz()/ncols; //roughly a factor of 2 since only lower tri. of A is stored

     const el_type alpha = (1.0+sqrt(17.0))/8.0;  //pivoting threshold (1+sqrt(17))/8, approx. 0.64.
     //w1/wr: largest off-diagonal entry of the current/candidate column (as returned by max()).
     //d1/dr: diagonal entry of the current/candidate column.
     el_type w1(-1), wr(-1), d1(-1), dr(-1);     //for use in bk-pivoting
     el_type det_D, D_inv11, D_inv22, D_inv12;   //determinant and inverse of a 2x2 pivot block
     el_type l_11, l_12;                         //entries of the two L columns produced by a 2x2 pivot

     vector<bool> in_set(ncols, false); //bitset used for unsorted merges
     swap_struct<el_type> s; //struct containing temp vars used in pivoting.

     //work holds the current column (k) in dense form, temp the candidate column (r).
     //Both are all-zero between iterations; see the reset section at the end of the loop.
     elt_vector_type work(ncols, 0), temp(ncols, 0);
     idx_vector_type curr_nnzs, temp_nnzs;  //non-zero indices of work and temp respectively.
     curr_nnzs.reserve(ncols); //reserves space for worst case (entire col is non-zero)

     int count = 0; //the total number of nonzeros stored in L.
     //k: current column, r: row of the pivot candidate, i/j: scratch indices,
     //col_size/col_size2: final lengths of columns k and k+1 of L.
     int i, j, k, r, offset, col_size, col_size2(-1);
     bool size_two_piv = false;  //boolean indicating if the pivot is 2x2 or 1x1

     //--------------- allocate memory for L and D ------------------//
     L.resize(ncols, ncols); //allocate a vector of size n for Llist as well
     D.resize(ncols );

     //------------------- main loop: factoring begins -------------------------//
     //note: k is incremented a second time at the bottom of the loop body after a 2x2 pivot.
     for (k = 0; k < ncols; k++) {

         //curr nnz vector starts out empty and is cleared at the end of each loop iteration.
         //assign nonzeros indices of A(k:n, k) to curr_nnzs
         curr_nnzs.assign (m_idx[k].begin(), m_idx[k].end());

         //assign nonzero values of A(k:n, k) to work
         for (j = 0; j < (int) curr_nnzs.size(); j++) {
             work[curr_nnzs[j]] = m_x[k][j];
         }
         //the scatter above relies on curr_nnzs still being in m_idx[k] order, so sort only afterwards.
         sort(curr_nnzs.begin(), curr_nnzs.end());

         //--------------begin pivoting--------------//
         // the pivoting below DEFINITELY needs to be refactored into a separate function

         //do delayed updates on current column. work = Sum_{i=0}^{k-1} L(k,i) * D(i,i) * L(k:n, i)
         //(the formula above generalizes to block matrix form in the case of 2x2 pivots).
         update(k, work, curr_nnzs, L, D, in_set);

         //store diagonal element in d1. set diagonal element in work vector to 0
         //since we want to find the maximum off-diagonal element.
         d1 = work[k];
         work[k] = 0;

         //find maximum element in work and store its index in r.
         //(w1 is compared against eps and abs(d1) below, so max() presumably returns a magnitude.)
         w1 = max(work, curr_nnzs, r);

         if (piv_type == pivot_type::BKP) {
             //we do partial pivoting here, where we take the first element u in the column that satisfies
             //|u| > pp_tol*|w1|. for more information, consult "A Partial Pivoting Strategy for Sparse
             //Symmetric Matrix Decomposition" by J.H. Liu (1987).
             int t = r; //stores location of u
             el_type u = w1; //stores value of u
             for (i = 0; i < (int) curr_nnzs.size(); i++) {
                 if (abs(work[curr_nnzs[i]])-pp_tol*w1 > eps ) {
                     t = curr_nnzs[i];
                     u = work[t];
                     break;
                 }
             }

             //bunch-kaufman partial pivoting is used below. for a more detailed reference,
             //refer to "Accuracy and Stability of Numerical Algorithms." by Higham (2002).
             //------------------- begin bunch-kaufman pivoting ------------------//
             if (w1 < eps) {
                 //case 0: do nothing. pivot is k.
             } else if ( (alpha * w1 - abs(d1)) < eps  ) {
                 //case 1: do nothing. pivot is k.
             } else {
                 //since we are doing partial pivoting, we should treat u and t like w1 and r, so
                 //we'll just reassign w1 and r. note: this has to go in the else clause since
                 //we still use the old w1 for case 0 and case 1.
                 w1 = u;
                 r = t;

                 offset = row_first[r];
                 //assign all nonzero indices and values in A(r, k:r)
                 //( not including A(r,r) ) to temp and temp_nnzs
                 for (j = offset; j < (int) list[r].size(); j++) {
                     temp_nnzs.push_back(list[r][j]);
                     temp[list[r][j]] = coeff(r, list[r][j]);
                 }

                 //assign nonzero indices of A(r:n, r) to temp_nnzs
                 temp_nnzs.insert(temp_nnzs.end(), m_idx[r].begin(), m_idx[r].end());

                 //assign nonzero values of A(r:n, r) to temp
                 for (j = 0; j < (int) m_idx[r].size(); j++) {
                     temp[m_idx[r][j]] = m_x[r][j];
                 }

                 //perform delayed updates on temp. temp = Sum_{i=0}^{k-1} L(r,i) * D(i,i) * L(k:n, i).
                 //(the formula above generalizes to block matrix form in the case of 2x2 pivots).
                 update(r, temp, temp_nnzs, L, D, in_set);

                 //same trick as for work: remember the diagonal and zero it so that
                 //max() only sees off-diagonal entries.
                 dr = temp[r];
                 temp[r] = 0;

                 //find maximum element in temp. (its index lands in j and is not used in this branch.)
                 wr = max(temp, temp_nnzs, j);

                 if ((alpha*w1*w1 - abs(d1)*wr) < eps) {
                     //case 2: do nothing. pivot is k.

                 } else if ( (alpha * wr - abs(dr)) < eps) {
                     //case 3: pivot is k with r: 1x1 pivot case.
                     //restore the diagonal entries that were zeroed for the max() searches.
                     temp[r] = dr;
                     work[k] = d1;

                     //--------pivot A and L ---------//
                     pivot(s, in_set, L, k, r);

                     //----------pivot rest ----------//

                     //permute perm
                     std::swap(perm[k], perm[r]);

                     //column r becomes the current column: work now holds it, temp holds old column k.
                     work.swap(temp);    //swap work with temp.
                     std::swap(work[k], work[r]); //swap kth and rth row of work

                     curr_nnzs.swap(temp_nnzs);  //swap curr_nnzs with temp_nnzs

                     safe_swap(curr_nnzs, k, r); //swap k and r if they are present in curr_nnzs

                     d1 = work[k];
                     //--------end pivot rest---------//

                 } else {
                     //case 4: pivot is k+1 with r: 2x2 pivot case.

                     //must advance list for 2x2 pivot since we are pivoting on col k+1
                     advance_list(k);
                     //for the same reason as above, we must advance L.first as well
                     L.advance_first(k);

                     //restore diagonal elements in work and temp
                     temp[r] = dr;
                     work[k] = d1;

                     //indicate that pivot is 2x2
                     size_two_piv = true;

                     //if r is already k+1 no interchange is needed.
                     if (k+1 < r) {
                         //symmetrically permute row/col k+1 and r.
                         pivot(s, in_set, L, k+1, r);

                         //----------pivot rest ----------//

                         //permute perm
                         std::swap(perm[k+1], perm[r]);

                         //swap rows k+1 and r of work and temp
                         std::swap(work[k+1], work[r]);
                         std::swap(temp[k+1], temp[r]);

                         //swap k+1 and r in curr_nnzs and temp_nnzs
                         safe_swap(curr_nnzs, k+1, r);
                         safe_swap(temp_nnzs, k+1, r);
                     }

                     //diagonal of the 2x2 block: d1 = block(0,0), dr = block(1,1).
                     //the off-diagonal is read from work[k+1] further below.
                     d1 = work[k];
                     dr = temp[k+1];
                 }
             }
             //--------------end bkp pivoting--------------//
         } else if (piv_type == pivot_type::ROOK) {
             //--------------begin rook pivoting--------------//
             //i is the index of the column currently held in work (starts at k);
             //r is the row of that column's largest off-diagonal entry.
             i = k;
             work[k] = d1; //restore the diagonal that was zeroed before the max() search

             if (alpha * w1 <= abs(d1) + eps) {
                 // do nothing: the diagonal is large enough, column k is used as a 1x1 pivot.
             } else {
                 //walk from candidate to candidate until one of the two break conditions below holds.
                 while (true) {
                     // reset temp: zero the entries recorded in temp_nnzs (left over from the
                     // previous candidate column), then empty the index list.
                     for (idx_it it = temp_nnzs.begin(); it != temp_nnzs.end(); it++) {
                         temp[*it] = 0;
                     }
                     temp_nnzs.clear();

                     offset = row_first[r];
                     //assign all nonzero indices and values in A(r, k:r)
                     //( not including A(r,r) ) to temp and temp_nnzs
                     for (j = offset; j < (int) list[r].size(); j++) {
                         temp_nnzs.push_back(list[r][j]);
                         temp[list[r][j]] = coeff(r, list[r][j]);
                     }

                     //assign nonzero indices of A(r:n, r) to temp_nnzs
                     temp_nnzs.insert(temp_nnzs.end(), m_idx[r].begin(), m_idx[r].end());

                     //assign nonzero values of A(r:n, r) to temp
                     for (j = 0; j < (int) m_idx[r].size(); j++) {
                         temp[m_idx[r][j]] = m_x[r][j];
                     }

                     //perform delayed updates on temp. temp = Sum_{i=0}^{k-1} L(r,i) * D(i,i) * L(k:n, i).
                     //(the formula above generalizes to block matrix form in the case of 2x2 pivots).
                     update(r, temp, temp_nnzs, L, D, in_set);

                     //hide the diagonal while searching for the largest off-diagonal entry,
                     //then put it back.
                     dr = temp[r];
                     temp[r] = 0;

                     //find maximum element in temp. its index is stored in j (the next candidate row).
                     wr = max(temp, temp_nnzs, j);
                     temp[r] = dr;

                     if (alpha * wr <= abs(dr) + eps) {
                         //the diagonal of column r is large enough: use r as a 1x1 pivot.
                         // swap rows and columns k and r
                         pivot(s, in_set, L, k, r);

                         std::swap(perm[k], perm[r]);

                         //permute the candidate column and make it the current column.
                         std::swap(temp[k], temp[r]);
                         work.swap(temp);

                         safe_swap(temp_nnzs, k, r);
                         curr_nnzs.swap(temp_nnzs);

                         d1 = work[k];
                         break;
                     } else if (abs(w1 - wr) < eps) {
                         //the largest off-diagonal entries of columns i and r agree to within eps:
                         //use (i, r) as a 2x2 pivot, moved to positions (k, k+1).
                         size_two_piv = true;
                         // swap rows and columns k and i, k+1 and r
                         if (k != i) {
                             //symmetrically permute row/col k and i.
                             pivot(s, in_set, L, k, i);

                             //----------pivot rest ----------//

                             //permute perm
                             std::swap(perm[k], perm[i]);

                             //swap rows k and i of work and temp
                             std::swap(work[k], work[i]);
                             std::swap(temp[k], temp[i]);

                             //swap k and i in curr_nnzs and temp_nnzs
                             safe_swap(curr_nnzs, k, i);
                             safe_swap(temp_nnzs, k, i);

                             d1 = work[k];
                         }

                         //as in the BKP 2x2 case, step list and L.first past column k
                         //before touching column k+1.
                         advance_list(k);
                         L.advance_first(k);

                         if (k+1 < r) {
                             //symmetrically permute row/col k+1 and r.
                             pivot(s, in_set, L, k+1, r);

                             //----------pivot rest ----------//

                             //permute perm
                             std::swap(perm[k+1], perm[r]);

                             //swap rows k+1 and r of work and temp
                             std::swap(work[k+1], work[r]);
                             std::swap(temp[k+1], temp[r]);

                             //swap k+1 and r in curr_nnzs and temp_nnzs
                             safe_swap(curr_nnzs, k+1, r);
                             safe_swap(temp_nnzs, k+1, r);

                             dr = temp[k+1];
                         }
                         break;
                     } else {
                         //neither test passed: column r becomes the current column and the row of
                         //its largest off-diagonal entry (j) becomes the next candidate.
                         i = r;
                         w1 = wr;
                         r = j;
                         work.swap(temp);
                         curr_nnzs.swap(temp_nnzs);
                     }
                 }
             }
             //--------------end rook pivoting--------------//
         }

         //erase diagonal element from non-zero indices (to exclude it from being dropped)
         curr_nnzs.erase(std::remove(curr_nnzs.begin(), curr_nnzs.end(), k), curr_nnzs.end());

         //performs the dual dropping procedure.
         if (!size_two_piv) {
             //perform dual dropping criteria on work
             drop_tol(work, curr_nnzs, lfil, tol);

         } else {
             //erase diagonal 2x2 block from non-zero indices (to exclude it from being dropped)
             temp_nnzs.erase(std::remove(temp_nnzs.begin(), temp_nnzs.end(), k), temp_nnzs.end());
             curr_nnzs.erase(std::remove(curr_nnzs.begin(), curr_nnzs.end(), k+1), curr_nnzs.end());
             temp_nnzs.erase(std::remove(temp_nnzs.begin(), temp_nnzs.end(), k+1), temp_nnzs.end());

             //compute inverse of the 2x2 block diagonal pivot [d1, work[k+1]; work[k+1], dr].
             det_D = d1*dr - work[k+1]*work[k+1];
             if ( abs(det_D) < eps) det_D = 1e-6;  //statically pivot;
             D_inv11 = dr/det_D;
             D_inv22 = d1/det_D;
             D_inv12 = -work[k+1]/det_D;

             //assign pivot to D (d1 is assigned to D(k,k) later)
             D.off_diagonal(k) = work[k+1];
             D[k+1] = dr;

             //merge nonzeros of curr and temp together so iterating through them will be easier
             unordered_inplace_union(curr_nnzs, temp_nnzs.begin(), temp_nnzs.end(), in_set);


             //multiply inverse of pivot to work and temp (gives us two columns of l)
             for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
                 l_11 = work[*it]*D_inv11 + temp[*it]*D_inv12;
                 l_12 = work[*it]*D_inv12 + temp[*it]*D_inv22;

                 //note that work and temp roughly share the same non-zero indices
                 work[*it] = l_11;
                 temp[*it] = l_12;
             }

             //since the work and temp non-zero indices are roughly the same,
             //we can copy it over to temp_nnzs
             temp_nnzs.assign(curr_nnzs.begin(), curr_nnzs.end());

             //perform dual dropping procedure on work and temp
             drop_tol(temp, temp_nnzs, lfil, tol);
             drop_tol(work, curr_nnzs, lfil, tol);


         }

         //resize kth column of L to proper size.
         //(upper bound: diagonal + every surviving index; trimmed to col_size at the end of the iteration.)
         L.m_idx[k].resize(curr_nnzs.size()+1);
         L.m_x[k].resize(curr_nnzs.size()+1);

         //assign diagonal element to D
         D[k] = d1;

         //assign 1s to diagonal of L.
         L.m_x[k][0] = 1;
         L.m_idx[k][0] = k;
         count++;

         if (!size_two_piv) {
             if ( abs(D[k]) < eps) D[k] = 1e-6; //statically pivot
             //i is the next free slot in column k of L (slot 0 holds the unit diagonal).
             i = 1;
             for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
                 //entries that are (numerically) zero are not stored.
                 if ( abs(work[*it]) > eps) {
                     L.m_idx[k][i] = *it; //col k nonzero indices of L are stored
                     L.m_x[k][i] = work[*it]/D[k]; //col k nonzero values of L are stored

                     L.list[*it].push_back(k); //update Llist
                     count++;
                     i++;
                 }
             }

             col_size = i;

             //advance list and L.first
             L.advance_first(k);
             advance_list(k);
         } else {
             //resize k+1th column of L to proper size.
             L.m_idx[k+1].resize(temp_nnzs.size()+1);
             L.m_x[k+1].resize(temp_nnzs.size()+1);

             //assign 1s to diagonal of L.
             L.m_x[k+1][0] = 1;
             L.m_idx[k+1][0] = k+1;
             count++;

             //work and temp were already multiplied by the inverse of the 2x2 block above,
             //so the values are stored as they are (no division by D here).
             i = 1;
             for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
                 if ( abs(work[*it]) > eps) {
                     L.m_x[k][i] = work[*it]; //col k nonzero values of L are stored
                     L.m_idx[k][i] = *it; //col k nonzero indices of L are stored

                     L.list[*it].push_back(k); //update L.list
                     count++;
                     i++;
                 }

             }

             j = 1;
             for (idx_it it = temp_nnzs.begin(); it != temp_nnzs.end(); it++) {
                 if ( abs(temp[*it]) > eps) {
                     L.m_x[k+1][j] = temp[*it]; //col k+1 nonzero values of L are stored
                     L.m_idx[k+1][j] = *it; //col k+1 nonzero indices of L are stored

                     L.list[*it].push_back(k+1); //update L.list
                     count++;
                     j++;
                 }

             }

             col_size = i;
             col_size2 = j;

             //update list and L.first
             //(the step for column k was already taken when the 2x2 pivot was chosen.)
             L.advance_first(k+1);
             advance_list(k+1);

         }

         // ------------- reset temp and work back to zero -----------------//
         //positions k and k+1 were erased from the index lists above, so they are cleared explicitly.
         work[k] = 0;
         temp[k] = 0;

         if (k + 1 < ncols) {
             temp[k+1] = 0;
             work[k+1] = 0;
         }

         for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
             work[*it] = 0;
         }
         curr_nnzs.clear(); //work is zeroed; empty its index list for the next iteration

         for (idx_it it = temp_nnzs.begin(); it != temp_nnzs.end(); it++) {
             temp[*it] = 0;
         }
         temp_nnzs.clear(); //temp is zeroed; empty its index list for the next iteration

         //-------------------------------------------------------------------//

         //resize columns of L to correct size
         L.m_x[k].resize(col_size);
         L.m_idx[k].resize(col_size);

         if (size_two_piv) {
             L.m_x[k+1].resize(col_size2);
             L.m_idx[k+1].resize(col_size2);
             k++; //column k+1 was factored together with column k; skip it.

             size_two_piv = false;
         }
     }

     //assign number of non-zeros in L to L.nnz_count
     L.nnz_count = count;

 }

 #endif
lil_sparse_matrix::nnz_count
int nnz_count
Number of nonzeros in the matrix.
Definition: lil_sparse_matrix.h:32

block_diag_matrix::off_diagonal
el_type & off_diagonal(int i)
Definition: block_diag_matrix.h:114

lil_sparse_matrix::m_x
vector< elt_vector_type > m_x
The values of the nonzeros in the matrix.
Definition: lil_sparse_matrix.h:36

lil_sparse_matrix::m_idx
vector< idx_vector_type > m_idx
The row/col indices. The way m_idx is used depends on whether the matrix is in LIL-C or LIL-R...
Definition: lil_sparse_matrix.h:35

block_diag_matrix::resize
void resize(int n, el_type default_value)
Resizes this matrix to an n*n matrix with default_value on the main diagonal.
Definition: block_diag_matrix.h:70

lilc_matrix::advance_first
void advance_first(const int &k)
Updates A.first for iteration k.
Definition: lilc_matrix_declarations.h:328

lilc_matrix
A list-of-lists (LIL) matrix in column oriented format.
Definition: lilc_matrix.h:9

block_diag_matrix
A quick implementation of a diagonal matrix with 1x1 and 2x2 blocks.
Definition: block_diag_matrix.h:39

swap_struct
A structure containing variables used in pivoting a LIL-C matrix.
Definition: swap_struct.h:6

lilc_matrix::resize
void resize(int n_rows, int n_cols)
Resizes the matrix. For use in preallocating space before factorization begins.
Definition: lilc_matrix_declarations.h:119

lilc_matrix::list
std::vector< std::vector< int > > list
A list of linked lists that gives the non-zero elements in each row of A. Since at any time we may sw...
Definition: lilc_matrix_declarations.h:44

lilc_matrix::ildl
void ildl(lilc_matrix< el_type > &L, block_diag_matrix< el_type > &D, idx_vector_type &perm, const double &fill_factor, const double &tol, const double &pp_tol, int piv_type=pivot_type::BKP)
Performs an LDL' factorization of this matrix.
Definition: lilc_matrix_ildl.h:10