sym-ildl/html/lilc__matrix__ildl__inplace_8h_source.html

 #ifndef _LILC_MATRIX_ILDL_INPLACE_H_
 #define _LILC_MATRIX_ILDL_INPLACE_H_


 // NOTE(review): these using-declarations sit at header scope, so the names
 // endl, cout and abs become visible unqualified in every translation unit
 // that includes this header. The factorization code in this file relies on
 // the unqualified abs(); endl and cout are not referenced in this file --
 // confirm no other header depends on them before removing.
 using std::endl;
 using std::cout;
 using std::abs;

 /*! \brief Performs an in-place incomplete LDL' factorization of this matrix.
  *
  *  The matrix is processed one column at a time (two columns at a time when a
  *  2x2 pivot is chosen). For each step the routine
  *    1. scatters column k into the dense work vector and applies the delayed
  *       updates from the already-factored columns (update()),
  *    2. optionally searches for a pivot (Bunch-Kaufman with partial pivoting,
  *       or rook pivoting) and symmetrically permutes the matrix (pivotA()),
  *    3. drops entries according to drop_tol(), and
  *    4. overwrites column k (and k+1 for a 2x2 pivot) of this matrix with the
  *       corresponding column(s) of L, storing a 1 on the diagonal, and writes
  *       the pivot into D.
  *  Pivots whose magnitude (or determinant, for 2x2 pivots) is below eps are
  *  replaced by 1e-6 (static pivoting). On exit nnz_count holds the number of
  *  entries stored in L.
  *
  *  \param D           receives the block diagonal factor; resized to n_cols().
  *  \param perm        permutation vector; its entries are swapped in lock-step
  *                     with every symmetric row/column swap. It is not
  *                     initialized here -- presumably the caller passes the
  *                     identity permutation of length n_cols() (TODO confirm).
  *  \param fill_factor controls the per-column fill limit handed to drop_tol():
  *                     lfil = 2*fill_factor*nnz()/n_cols(), or n_cols() when
  *                     fill_factor exceeds 1e4.
  *  \param tol         drop tolerance handed to drop_tol().
  *  \param pp_tol      threshold used by the partial pivoting search in the
  *                     Bunch-Kaufman branch.
  *  \param piv_type    pivot_type::BKP or pivot_type::ROOK. For any other value
  *                     no pivot search is performed and the diagonal entry is
  *                     always used as a 1x1 pivot.
  */
 template <class el_type>
 void lilc_matrix<el_type> :: ildl_inplace(block_diag_matrix<el_type>& D, idx_vector_type& perm, const double& fill_factor, const double& tol, const double& pp_tol, int piv_type)
 {

     //----------------- initialize temporary variables --------------------//
     const int ncols = n_cols(); //number of cols in A.

     //maximum number of off-diagonal entries kept per column of L.
     int lfil;
     //a giant fill factor simply means "keep everything". an empty matrix is handled
     //here as well, since the formula below would divide by zero and converting the
     //resulting NaN/inf to int is undefined behaviour.
     if (fill_factor > 1e4 || ncols == 0) lfil = ncols;
     else lfil = (int) (2*fill_factor*nnz()/ncols); //roughly a factor of 2 since only lower tri. of A is stored

     const el_type alpha = (1.0+sqrt(17.0))/8.0;  //for use in pivoting.
     el_type w1(-1), wr(-1), d1(-1), dr(-1);     //for use in bk-pivoting
     el_type det_D, D_inv11, D_inv22, D_inv12;   //for use in 2x2 pivots
     el_type l_11, l_12;                         //for use in 2x2 pivots

     vector<bool> in_set(ncols, false); //bitset used for unsorted merges
     swap_struct<el_type> s; //struct containing temp vars used in pivoting.

     //dense scratch columns: work holds the current column k, temp holds the
     //candidate pivot column r (which becomes column k+1 for a 2x2 pivot).
     elt_vector_type work(ncols, 0), temp(ncols, 0);
     idx_vector_type curr_nnzs, temp_nnzs;  //non-zero indices of work and temp.
     curr_nnzs.reserve(ncols); //reserves space for worst case (entire col is non-zero)

     int count = 0; //the total number of nonzeros stored in L.
     int i, j, k, r, offset, col_size, col_size2(-1);
     bool size_two_piv = false;  //boolean indicating if the pivot is 2x2 or 1x1

     //--------------- allocate memory for L and D ------------------//
     D.resize(ncols);

     //------------------- main loop: factoring begins -------------------------//
     for (k = 0; k < ncols; k++) {
         //curr nnz vector starts out empty and is cleared at the end of each loop iteration.
         //assign nonzeros indices of A(k:n, k) to curr_nnzs
         curr_nnzs.assign (m_idx[k].begin(), m_idx[k].end());

         //assign nonzero values of A(k:n, k) to work
         for (j = 0; j < (int) curr_nnzs.size(); j++) {
             work[curr_nnzs[j]] = m_x[k][j];
         }
         //sort only after scattering: the loop above pairs curr_nnzs[j] with m_x[k][j].
         sort(curr_nnzs.begin(), curr_nnzs.end());

         //--------------begin pivoting--------------//

         //do delayed updates on current column. work = Sum_{i=0}^{k-1} L(k,i) * D(i,i) * L(k:n, i)
         //(the formula above generalizes to block matrix form in the case of 2x2 pivots).
         update(k, work, curr_nnzs, *this, D, in_set);

         //store diagonal element in d1. set diagonal element in work vector to 0
         //since we want to find the maximum off-diagonal element.
         d1 = work[k];
         work[k] = 0;

         //find maximum element in work and store its index in r.
         w1 = max(work, curr_nnzs, r);

         if (piv_type == pivot_type::BKP) {
             //we do partial pivoting here, where we take the first element u in the column that satisfies
             //|u| > pp_tol*|w1|. for more information, consult "A Partial Pivoting Strategy for Sparse
             //Symmetric Matrix Decomposition" by J.H. Liu (1987).
             int t = r; //stores location of u
             el_type u = w1; //stores value of u
             for (i = 0; i < (int) curr_nnzs.size(); i++) {
                 if (abs(work[curr_nnzs[i]])-pp_tol*w1 > eps ) {
                     t = curr_nnzs[i];
                     u = work[t];
                     break;
                 }
             }

             //bunch-kaufman partial pivoting is used below. for a more detailed reference,
             //refer to "Accuracy and Stability of Numerical Algorithms." by Higham (2002).
             //------------------- begin bunch-kaufman pivoting ------------------//
             if (w1 < eps) {
                 //case 0: do nothing. pivot is k.
             } else if ( (alpha * w1 - abs(d1)) < eps  ) {
                 //case 1: do nothing. pivot is k.
             } else {
                 //since we are doing partial pivoting, we should treat u and t like w1 and r, so
                 //we'll just reassign w1 and r. note: this has to go in the else clause since
                 //we still use the old w1 for case 0 and case 1.
                 w1 = u;
                 r = t;

                 offset = row_first[r];
                 //assign all nonzero indices and values in A(r, k:r)
                 //( not including A(r,r) ) to temp and temp_nnzs
                 for (j = offset; j < (int) list[r].size(); j++) {
                     temp_nnzs.push_back(list[r][j]);
                     temp[list[r][j]] = coeff(r, list[r][j]);
                 }

                 //assign nonzero indices of A(r:n, r) to temp_nnzs
                 temp_nnzs.insert(temp_nnzs.end(), m_idx[r].begin(), m_idx[r].end());

                 //assign nonzero values of A(r:n, r) to temp
                 for (j = 0; j < (int) m_idx[r].size(); j++) {
                     temp[m_idx[r][j]] = m_x[r][j];
                 }

                 //perform delayed updates on temp. temp = Sum_{i=0}^{k-1} L(r,i) * D(i,i) * L(k:n, i).
                 //(the formula above generalizes to block matrix form in the case of 2x2 pivots).
                 update(r, temp, temp_nnzs, *this, D, in_set);

                 //same trick as for work: hide the diagonal while searching for the max.
                 dr = temp[r];
                 temp[r] = 0;

                 //find maximum element in temp (its index, written to j, is not needed here).
                 wr = max(temp, temp_nnzs, j);

                 if ((alpha*w1*w1 - abs(d1)*wr) < eps) {
                     //case 2: do nothing. pivot is k.

                 } else if ( (alpha * wr - abs(dr)) < eps) {

                     //case 3: pivot is k with r: 1x1 pivot case.
                     temp[r] = dr;
                     work[k] = d1;

                     //--------pivot A ---------//
                     pivotA(s, in_set, k, r);

                     //----------pivot rest ----------//
                     std::swap(d1, dr);

                     //permute perm
                     std::swap(perm[k], perm[r]);

                     work.swap(temp);    //swap work with temp.
                     std::swap(work[k], work[r]); //swap kth and rth row of work

                     curr_nnzs.swap(temp_nnzs);  //swap curr_nnzs with temp_nnzs

                     safe_swap(curr_nnzs, k, r); //swap k and r if they are present in curr_nnzs

                     //--------end pivot rest---------//

                 } else {
                     //case 4: pivot is k+1 with r: 2x2 pivot case.

                     // remove col k from the row lists for convenience while we are pivoting on col k+1
                     for (int p = 0; p < (int) m_idx[k].size(); p++) {
                         int l = m_idx[k][p];
                         if (l == k) continue;
                         for (int q = row_first[l]; q < (int) list[l].size(); q++) {
                             if (list[l][q] == k) {
                                 //order within the list does not matter: overwrite with the last entry and shrink.
                                 std::swap(list[l][q], list[l][list[l].size()-1]);
                                 list[l].pop_back();
                                 break;
                             }
                         }
                     }
                     m_x[k].clear();
                     m_idx[k].clear();
                     col_first[k] = 0;

                     //restore diagonal elements in work and temp
                     temp[r] = dr;
                     work[k] = d1;

                     //indicate that pivot is 2x2
                     size_two_piv = true;

                     if (k+1 < r) {
                         //symmetrically permute row/col k+1 and r.
                         pivotA(s, in_set, k+1, r);

                         //----------pivot rest ----------//

                         //permute perm
                         std::swap(perm[k+1], perm[r]);

                         //swap rows k+1 and r of work and temp
                         std::swap(work[k+1], work[r]);
                         std::swap(temp[k+1], temp[r]);

                         //swap k+1 and r in curr_nnzs and temp_nnzs
                         safe_swap(curr_nnzs, k+1, r);
                         safe_swap(temp_nnzs, k+1, r);
                     }
                 }
             }
             //--------------end bkp pivoting--------------//
         } else if (piv_type == pivot_type::ROOK) {
             //--------------begin rook pivoting--------------//
             //i is the index of the column currently held in work (starts at k);
             //r is the index of the candidate column loaded into temp.
             i = k;
             work[k] = d1;

             if (alpha * w1 <= abs(d1) + eps) {
                 // do nothing: the diagonal entry is an acceptable 1x1 pivot.
             } else {
                 while (true) {
                     // clear whatever the previous iteration left in temp
                     for (idx_it it = temp_nnzs.begin(); it != temp_nnzs.end(); it++) {
                         temp[*it] = 0;
                     }
                     temp_nnzs.clear();

                     offset = row_first[r];
                     //assign all nonzero indices and values in A(r, k:r)
                     //( not including A(r,r) ) to temp and temp_nnzs
                     for (j = offset; j < (int) list[r].size(); j++) {
                         temp_nnzs.push_back(list[r][j]);
                         temp[list[r][j]] = coeff(r, list[r][j]);
                     }

                     //assign nonzero indices of A(r:n, r) to temp_nnzs
                     temp_nnzs.insert(temp_nnzs.end(), m_idx[r].begin(), m_idx[r].end());

                     //assign nonzero values of A(r:n, r) to temp
                     for (j = 0; j < (int) m_idx[r].size(); j++) {
                         temp[m_idx[r][j]] = m_x[r][j];
                     }

                     //perform delayed updates on temp. temp = Sum_{i=0}^{k-1} L(r,i) * D(i,i) * L(k:n, i).
                     //(the formula above generalizes to block matrix form in the case of 2x2 pivots).
                     update(r, temp, temp_nnzs, *this, D, in_set);

                     dr = temp[r];
                     temp[r] = 0;

                     //find maximum off-diagonal element in temp; j receives its index.
                     wr = max(temp, temp_nnzs, j);
                     temp[r] = dr;

                     if (alpha * wr <= abs(dr) + eps) {
                         //1x1 pivot on the diagonal of column r.
                         // swap rows and columns k and r
                         this->pivotA(s, in_set, k, r);

                         std::swap(perm[k], perm[r]);

                         std::swap(temp[k], temp[r]);
                         work.swap(temp);

                         safe_swap(temp_nnzs, k, r);
                         curr_nnzs.swap(temp_nnzs);

                         d1 = work[k];
                         break;
                     } else if (abs(w1 - wr) < eps) {
                         //2x2 pivot formed by columns i and r.
                         size_two_piv = true;
                         // swap rows and columns k and i, k+1 and r
                         if (k != i) {
                             this->pivotA(s, in_set, k, i);

                             std::swap(perm[k], perm[i]);

                             std::swap(work[k], work[i]);
                             std::swap(temp[k], temp[i]);

                             safe_swap(curr_nnzs, k, i);
                             safe_swap(temp_nnzs, k, i);

                             d1 = work[k];
                         }

                         if (k+1 < r) {
                             this->pivotA(s, in_set, k+1, r);

                             std::swap(perm[k+1], perm[r]);

                             std::swap(work[k+1], work[r]);
                             std::swap(temp[k+1], temp[r]);

                             safe_swap(curr_nnzs, k+1, r);
                             safe_swap(temp_nnzs, k+1, r);

                             dr = temp[k+1];
                         }
                         break;
                     } else {
                         //keep searching: column r becomes the current column and the
                         //location of its largest off-diagonal entry is the next candidate.
                         i = r;
                         w1 = wr;
                         r = j;
                         work.swap(temp);
                         curr_nnzs.swap(temp_nnzs);
                     }
                 }
             }
             //--------------end rook pivoting--------------//
         }

         //erase diagonal element from non-zero indices (to exclude it from being dropped)
         curr_nnzs.erase(std::remove(curr_nnzs.begin(), curr_nnzs.end(), k), curr_nnzs.end());

         //performs the dual dropping procedure.
         if (!size_two_piv) {
             //perform dual dropping criteria on work
             drop_tol(work, curr_nnzs, lfil, tol);

         } else {
             //erase diagonal 2x2 block from non-zero indices (to exclude it from being dropped)
             temp_nnzs.erase(std::remove(temp_nnzs.begin(), temp_nnzs.end(), k), temp_nnzs.end());
             curr_nnzs.erase(std::remove(curr_nnzs.begin(), curr_nnzs.end(), k+1), curr_nnzs.end());
             temp_nnzs.erase(std::remove(temp_nnzs.begin(), temp_nnzs.end(), k+1), temp_nnzs.end());

             //compute inverse of the 2x2 block diagonal pivot.
             det_D = d1*dr - work[k+1]*work[k+1];
             if ( abs(det_D) < eps) det_D = 1e-6;  //statically pivot;
             D_inv11 = dr/det_D;
             D_inv22 = d1/det_D;
             D_inv12 = -work[k+1]/det_D;

             //assign pivot to D (d1 is assigned to D(k,k) later)
             D.off_diagonal(k) = work[k+1];
             D[k+1] = dr;

             //merge nonzeros of curr and temp together so iterating through them will be easier
             unordered_inplace_union(curr_nnzs, temp_nnzs.begin(), temp_nnzs.end(), in_set);


             //multiply inverse of pivot to work and temp (gives us two columns of l)
             for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
                 l_11 = work[*it]*D_inv11 + temp[*it]*D_inv12;
                 l_12 = work[*it]*D_inv12 + temp[*it]*D_inv22;

                 //note that work and temp roughly share the same non-zero indices
                 work[*it] = l_11;
                 temp[*it] = l_12;
             }

             //since the work and temp non-zero indices are roughly the same,
             //we can copy it over to temp_nnzs
             temp_nnzs.assign(curr_nnzs.begin(), curr_nnzs.end());

             //perform dual dropping procedure on work and temp
             drop_tol(temp, temp_nnzs, lfil, tol);
             drop_tol(work, curr_nnzs, lfil, tol);
         }

         // remove current column from list, and add new column back in (inplace)
         for (i = 0; i < (int) m_idx[k].size(); i++) {
             r = m_idx[k][i];
             if (r == k) continue;
             for (j = row_first[r]; j < (int) list[r].size(); j++) {
                 if (list[r][j] == k) {
                     std::swap(list[r][j], list[r][list[r].size()-1]);
                     list[r].pop_back();
                     break;
                 }
             }
         }

         //resize kth column of L to an upper bound on its size (diagonal + candidates);
         //it is shrunk to the exact size once the entries have been written.
         m_idx[k].resize(curr_nnzs.size()+1);
         m_x[k].resize(curr_nnzs.size()+1);

         //assign diagonal element to D
         D[k] = d1;

         //assign 1s to diagonal of L.
         m_x[k][0] = 1;
         m_idx[k][0] = k;
         count++;

         if (!size_two_piv) {
             if ( abs(D[k]) < eps) D[k] = 1e-6; //statically pivot
             i = 1;

             for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
                 if ( abs(work[*it]) > eps) {
                     m_idx[k][i] = *it; //col k nonzero indices of L are stored
                     m_x[k][i] = work[*it]/D[k]; //col k nonzero values of L are stored

                     list[*it].push_back(k); //update Llist
                     count++;
                     i++;
                 }
             }

             col_size = i;
         } else {
             // remove occurrences of column k+1 from list, and add in new column
             for (i = 0; i < (int) m_idx[k+1].size(); i++) {
                 r = m_idx[k+1][i];
                 if (r == k+1) continue;
                 for (j = row_first[r]; j < (int) list[r].size(); j++) {
                     if (list[r][j] == k+1) {
                         std::swap(list[r][j], list[r][list[r].size()-1]);
                         list[r].pop_back();
                         break;
                     }
                 }
             }

             //work was already multiplied by the inverse pivot above, so no division here.
             i = 1;
             for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
                 if ( abs(work[*it]) > eps) {
                     m_x[k][i] = work[*it]; //col k nonzero values of L are stored
                     m_idx[k][i] = *it; //col k nonzero indices of L are stored

                     list[*it].push_back(k); //update Llist
                     count++;
                     i++;
                 }

             }

             //resize k+1th column of L to an upper bound on its size.
             m_idx[k+1].resize(temp_nnzs.size()+1);
             m_x[k+1].resize(temp_nnzs.size()+1);

             //assign 1s to diagonal of L.
             m_x[k+1][0] = 1;
             m_idx[k+1][0] = k+1;
             count++;

             j = 1;
             for (idx_it it = temp_nnzs.begin(); it != temp_nnzs.end(); it++) {
                 if ( abs(temp[*it]) > eps) {
                     m_x[k+1][j] = temp[*it]; //col k+1 nonzero values of L are stored
                     m_idx[k+1][j] = *it; //col k+1 nonzero indices of L are stored

                     list[*it].push_back(k+1); //update Llist
                     count++;
                     j++;
                 }

             }

             col_size = i;
             col_size2 = j;
         }

         // ------------- reset temp and work back to zero -----------------//
         //the diagonal positions were erased from the index lists above, so clear them explicitly.
         work[k] = 0;
         temp[k] = 0;

         if (k + 1 < ncols) {
             temp[k+1] = 0;
             work[k+1] = 0;
         }

         for (idx_it it = curr_nnzs.begin(); it != curr_nnzs.end(); it++) {
             work[*it] = 0;
         }
         curr_nnzs.clear(); //work vector is zeroed out

         for (idx_it it = temp_nnzs.begin(); it != temp_nnzs.end(); it++) {
             temp[*it] = 0;
         }
         temp_nnzs.clear(); //temp vector is zeroed out

         //-------------------------------------------------------------------//

         //resize columns of L to correct size
         m_x[k].resize(col_size);
         m_idx[k].resize(col_size);

         //update list and L.first
         col_first[k] = 1;
         advance_list(k);
         advance_first(k);

         if (size_two_piv) {
             m_x[k+1].resize(col_size2);
             m_idx[k+1].resize(col_size2);

             col_first[k+1] = 1;
             advance_first(k+1);
             advance_list(k+1);

             //a 2x2 pivot consumed two columns: skip the extra one.
             k++;

             size_two_piv = false;
         }
     }

     //assign number of non-zeros in L to L.nnz_count
     this->nnz_count = count;
 }

 #endif
block_diag_matrix::off_diagonal
el_type & off_diagonal(int i)
Definition: block_diag_matrix.h:114

lilc_matrix::ildl_inplace
void ildl_inplace(block_diag_matrix< el_type > &D, idx_vector_type &perm, const double &fill_factor, const double &tol, const double &pp_tol, int piv_type=pivot_type::BKP)
Performs an inplace LDL' factorization of this matrix.
Definition: lilc_matrix_ildl_inplace.h:10

block_diag_matrix::resize
void resize(int n, el_type default_value)
Resizes this matrix to an n*n matrix with default_value on the main diagonal.
Definition: block_diag_matrix.h:70

block_diag_matrix
A quick implementation of a diagonal matrix with 1x1 and 2x2 blocks.
Definition: block_diag_matrix.h:39

swap_struct
A structure containing variables used in pivoting a LIL-C matrix.
Definition: swap_struct.h:6