Mercurial > forge
diff main/sparse/SuperLU/SRC/zgssvx.c @ 0:6b33357c7561 octave-forge
Initial revision
author | pkienzle |
---|---|
date | Wed, 10 Oct 2001 19:54:49 +0000 |
parents | |
children | 7dad48fc229c |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/main/sparse/SuperLU/SRC/zgssvx.c Wed Oct 10 19:54:49 2001 +0000 @@ -0,0 +1,624 @@ + + +/* + * -- SuperLU routine (version 2.0) -- + * Univ. of California Berkeley, Xerox Palo Alto Research Center, + * and Lawrence Berkeley National Lab. + * November 15, 1997 + * + */ +#include "zsp_defs.h" +#include "util.h" + +void +zgssvx(char *fact, char *trans, char *refact, + SuperMatrix *A, factor_param_t *factor_params, int *perm_c, + int *perm_r, int *etree, char *equed, double *R, double *C, + SuperMatrix *L, SuperMatrix *U, void *work, int lwork, + SuperMatrix *B, SuperMatrix *X, double *recip_pivot_growth, + double *rcond, double *ferr, double *berr, + mem_usage_t *mem_usage, int *info ) +{ +/* + * Purpose + * ======= + * + * ZGSSVX solves the system of linear equations A*X=B or A'*X=B, using + * the LU factorization from zgstrf(). Error bounds on the solution and + * a condition estimate are also provided. It performs the following steps: + * + * 1. If A is stored column-wise (A->Stype = NC): + * + * 1.1. If fact = 'E', scaling factors are computed to equilibrate the + * system: + * trans = 'N': diag(R)*A*diag(C) *inv(diag(C))*X = diag(R)*B + * trans = 'T': (diag(R)*A*diag(C))**T *inv(diag(R))*X = diag(C)*B + * trans = 'C': (diag(R)*A*diag(C))**H *inv(diag(R))*X = diag(C)*B + * Whether or not the system will be equilibrated depends on the + * scaling of the matrix A, but if equilibration is used, A is + * overwritten by diag(R)*A*diag(C) and B by diag(R)*B (if trans='N') + * or diag(C)*B (if trans = 'T' or 'C'). + * + * 1.2. Permute columns of A, forming A*Pc, where Pc is a permutation + * matrix that usually preserves sparsity. + * For more details of this step, see sp_preorder.c. + * + * 1.3. If fact = 'N' or 'E', the LU decomposition is used to factor the + * matrix A (after equilibration if fact = 'E') as Pr*A*Pc = L*U, + * with Pr determined by partial pivoting. + * + * 1.4. Compute the reciprocal pivot growth factor. + * + * 1.5. If some U(i,i) = 0, so that U is exactly singular, then the + * routine returns with info = i. Otherwise, the factored form of + * A is used to estimate the condition number of the matrix A. If + * the reciprocal of the condition number is less than machine + * precision, info = A->ncol+1 is returned as a warning, but the + * routine still goes on to solve for X and computes error bounds + * as described below. + * + * 1.6. The system of equations is solved for X using the factored form + * of A. + * + * 1.7. Iterative refinement is applied to improve the computed solution + * matrix and calculate error bounds and backward error estimates + * for it. + * + * 1.8. If equilibration was used, the matrix X is premultiplied by + * diag(C) (if trans = 'N') or diag(R) (if trans = 'T' or 'C') so + * that it solves the original system before equilibration. + * + * 2. If A is stored row-wise (A->Stype = NR), apply the above algorithm + * to the transpose of A: + * + * 2.1. If fact = 'E', scaling factors are computed to equilibrate the + * system: + * trans = 'N': diag(R)*A'*diag(C) *inv(diag(C))*X = diag(R)*B + * trans = 'T': (diag(R)*A'*diag(C))**T *inv(diag(R))*X = diag(C)*B + * trans = 'C': (diag(R)*A'*diag(C))**H *inv(diag(R))*X = diag(C)*B + * Whether or not the system will be equilibrated depends on the + * scaling of the matrix A, but if equilibration is used, A' is + * overwritten by diag(R)*A'*diag(C) and B by diag(R)*B + * (if trans='N') or diag(C)*B (if trans = 'T' or 'C'). + * + * 2.2. Permute columns of transpose(A) (rows of A), + * forming transpose(A)*Pc, where Pc is a permutation matrix that + * usually preserves sparsity. + * For more details of this step, see sp_preorder.c. + * + * 2.3. If fact = 'N' or 'E', the LU decomposition is used to factor the + * transpose(A) (after equilibration if fact = 'E') as + * Pr*transpose(A)*Pc = L*U with the permutation Pr determined by + * partial pivoting. + * + * 2.4. Compute the reciprocal pivot growth factor. + * + * 2.5. If some U(i,i) = 0, so that U is exactly singular, then the + * routine returns with info = i. Otherwise, the factored form + * of transpose(A) is used to estimate the condition number of the + * matrix A. If the reciprocal of the condition number + * is less than machine precision, info = A->nrow+1 is returned as + * a warning, but the routine still goes on to solve for X and + * computes error bounds as described below. + * + * 2.6. The system of equations is solved for X using the factored form + * of transpose(A). + * + * 2.7. Iterative refinement is applied to improve the computed solution + * matrix and calculate error bounds and backward error estimates + * for it. + * + * 2.8. If equilibration was used, the matrix X is premultiplied by + * diag(C) (if trans = 'N') or diag(R) (if trans = 'T' or 'C') so + * that it solves the original system before equilibration. + * + * See supermatrix.h for the definition of 'SuperMatrix' structure. + * + * Arguments + * ========= + * + * fact (input) char* + * Specifies whether or not the factored form of the matrix + * A is supplied on entry, and if not, whether the matrix A should + * be equilibrated before it is factored. + * = 'F': On entry, L, U, perm_r and perm_c contain the factored + * form of A. If equed is not 'N', the matrix A has been + * equilibrated with scaling factors R and C. + * A, L, U, perm_r are not modified. + * = 'N': The matrix A will be factored, and the factors will be + * stored in L and U. + * = 'E': The matrix A will be equilibrated if necessary, then + * factored into L and U. + * + * trans (input) char* + * Specifies the form of the system of equations: + * = 'N': A * X = B (No transpose) + * = 'T': A**T * X = B (Transpose) + * = 'C': A**H * X = B (Transpose) + * + * refact (input) char* + * Specifies whether we want to re-factor the matrix. + * = 'N': Factor the matrix A. + * = 'Y': Matrix A was factored before, now we want to re-factor + * matrix A with perm_r and etree as inputs. Use + * the same storage for the L\U factors previously allocated, + * expand it if necessary. User should insure to use the same + * memory model. + * If fact = 'F', then refact is not accessed. + * + * A (input/output) SuperMatrix* + * Matrix A in A*X=B, of dimension (A->nrow, A->ncol). The number + * of the linear equations is A->nrow. Currently, the type of A can be: + * Stype = NC or NR, Dtype = _Z, Mtype = GE. In the future, + * more general A can be handled. + * + * On entry, If fact = 'F' and equed is not 'N', then A must have + * been equilibrated by the scaling factors in R and/or C. + * A is not modified if fact = 'F' or 'N', or if fact = 'E' and + * equed = 'N' on exit. + * + * On exit, if fact = 'E' and equed is not 'N', A is scaled as follows: + * If A->Stype = NC: + * equed = 'R': A := diag(R) * A + * equed = 'C': A := A * diag(C) + * equed = 'B': A := diag(R) * A * diag(C). + * If A->Stype = NR: + * equed = 'R': transpose(A) := diag(R) * transpose(A) + * equed = 'C': transpose(A) := transpose(A) * diag(C) + * equed = 'B': transpose(A) := diag(R) * transpose(A) * diag(C). + * + * factor_params (input) factor_param_t* + * The structure defines the input scalar parameters, consisting of + * the following fields. If factor_params = NULL, the default + * values are used for all the fields; otherwise, the values + * are given by the user. + * - panel_size (int): Panel size. A panel consists of at most + * panel_size consecutive columns. If panel_size = -1, use + * default value 8. + * - relax (int): To control degree of relaxing supernodes. If the + * number of nodes (columns) in a subtree of the elimination + * tree is less than relax, this subtree is considered as one + * supernode, regardless of the row structures of those columns. + * If relax = -1, use default value 8. + * - diag_pivot_thresh (double): Diagonal pivoting threshold. + * At step j of the Gaussian elimination, if + * abs(A_jj) >= diag_pivot_thresh * (max_(i>=j) abs(A_ij)), + * then use A_jj as pivot. 0 <= diag_pivot_thresh <= 1. + * If diag_pivot_thresh = -1, use default value 1.0, + * which corresponds to standard partial pivoting. + * - drop_tol (double): Drop tolerance threshold. (NOT IMPLEMENTED) + * At step j of the Gaussian elimination, if + * abs(A_ij)/(max_i abs(A_ij)) < drop_tol, + * then drop entry A_ij. 0 <= drop_tol <= 1. + * If drop_tol = -1, use default value 0.0, which corresponds to + * standard Gaussian elimination. + * + * perm_c (input/output) int* + * If A->Stype = NC, Column permutation vector of size A->ncol, + * which defines the permutation matrix Pc; perm_c[i] = j means + * column i of A is in position j in A*Pc. + * On exit, perm_c may be overwritten by the product of the input + * perm_c and a permutation that postorders the elimination tree + * of Pc'*A'*A*Pc; perm_c is not changed if the elimination tree + * is already in postorder. + * + * If A->Stype = NR, column permutation vector of size A->nrow, + * which describes permutation of columns of transpose(A) + * (rows of A) as described above. + * + * perm_r (input/output) int* + * If A->Stype = NC, row permutation vector of size A->nrow, + * which defines the permutation matrix Pr, and is determined + * by partial pivoting. perm_r[i] = j means row i of A is in + * position j in Pr*A. + * + * If A->Stype = NR, permutation vector of size A->ncol, which + * determines permutation of rows of transpose(A) + * (columns of A) as described above. + * + * If refact is not 'Y', perm_r is output argument; + * If refact = 'Y', the pivoting routine will try to use the input + * perm_r, unless a certain threshold criterion is violated. + * In that case, perm_r is overwritten by a new permutation + * determined by partial pivoting or diagonal threshold pivoting. + * + * etree (input/output) int*, dimension (A->ncol) + * Elimination tree of Pc'*A'*A*Pc. + * If fact is not 'F' and refact = 'Y', etree is an input argument, + * otherwise it is an output argument. + * Note: etree is a vector of parent pointers for a forest whose + * vertices are the integers 0 to A->ncol-1; etree[root]==A->ncol. + * + * equed (input/output) char* + * Specifies the form of equilibration that was done. + * = 'N': No equilibration. + * = 'R': Row equilibration, i.e., A was premultiplied by diag(R). + * = 'C': Column equilibration, i.e., A was postmultiplied by diag(C). + * = 'B': Both row and column equilibration, i.e., A was replaced + * by diag(R)*A*diag(C). + * If fact = 'F', equed is an input argument, otherwise it is + * an output argument. + * + * R (input/output) double*, dimension (A->nrow) + * The row scale factors for A or transpose(A). + * If equed = 'R' or 'B', A (if A->Stype = NC) or transpose(A) (if + * A->Stype = NR) is multiplied on the left by diag(R). + * If equed = 'N' or 'C', R is not accessed. + * If fact = 'F', R is an input argument; otherwise, R is output. + * If fact = 'F' and equed = 'R' or 'B', each element of R must + * be positive. + * + * C (input/output) double*, dimension (A->ncol) + * The column scale factors for A or transpose(A). + * If equed = 'C' or 'B', A (if A->Stype = NC) or transpose(A) (if + * A->Stype = NR) is multiplied on the right by diag(C). + * If equed = 'N' or 'R', C is not accessed. + * If fact = 'F', C is an input argument; otherwise, C is output. + * If fact = 'F' and equed = 'C' or 'B', each element of C must + * be positive. + * + * L (output) SuperMatrix* + * The factor L from the factorization + * Pr*A*Pc=L*U (if A->Stype = NC) or + * Pr*transpose(A)*Pc=L*U (if A->Stype = NR). + * Uses compressed row subscripts storage for supernodes, i.e., + * L has types: Stype = SC, Dtype = _Z, Mtype = TRLU. + * + * U (output) SuperMatrix* + * The factor U from the factorization + * Pr*A*Pc=L*U (if A->Stype = NC) or + * Pr*transpose(A)*Pc=L*U (if A->Stype = NR). + * Uses column-wise storage scheme, i.e., U has types: + * Stype = NC, Dtype = _Z, Mtype = TRU. + * + * work (workspace/output) void*, size (lwork) (in bytes) + * User supplied workspace, should be large enough + * to hold data structures for factors L and U. + * On exit, if fact is not 'F', L and U point to this array. + * + * lwork (input) int + * Specifies the size of work array in bytes. + * = 0: allocate space internally by system malloc; + * > 0: use user-supplied work array of length lwork in bytes, + * returns error if space runs out. + * = -1: the routine guesses the amount of space needed without + * performing the factorization, and returns it in + * mem_usage->total_needed; no other side effects. + * + * See argument 'mem_usage' for memory usage statistics. + * + * B (input/output) SuperMatrix* + * B has types: Stype = DN, Dtype = _Z, Mtype = GE. + * On entry, the right hand side matrix. + * On exit, + * if equed = 'N', B is not modified; otherwise + * if A->Stype = NC: + * if trans = 'N' and equed = 'R' or 'B', B is overwritten by + * diag(R)*B; + * if trans = 'T' or 'C' and equed = 'C' of 'B', B is + * overwritten by diag(C)*B; + * if A->Stype = NR: + * if trans = 'N' and equed = 'C' or 'B', B is overwritten by + * diag(C)*B; + * if trans = 'T' or 'C' and equed = 'R' of 'B', B is + * overwritten by diag(R)*B. + * + * X (output) SuperMatrix* + * X has types: Stype = DN, Dtype = _Z, Mtype = GE. + * If info = 0 or info = A->ncol+1, X contains the solution matrix + * to the original system of equations. Note that A and B are modified + * on exit if equed is not 'N', and the solution to the equilibrated + * system is inv(diag(C))*X if trans = 'N' and equed = 'C' or 'B', + * or inv(diag(R))*X if trans = 'T' or 'C' and equed = 'R' or 'B'. + * + * recip_pivot_growth (output) double* + * The reciprocal pivot growth factor max_j( norm(A_j)/norm(U_j) ). + * The infinity norm is used. If recip_pivot_growth is much less + * than 1, the stability of the LU factorization could be poor. + * + * rcond (output) double* + * The estimate of the reciprocal condition number of the matrix A + * after equilibration (if done). If rcond is less than the machine + * precision (in particular, if rcond = 0), the matrix is singular + * to working precision. This condition is indicated by a return + * code of info > 0. + * + * FERR (output) double*, dimension (B->ncol) + * The estimated forward error bound for each solution vector + * X(j) (the j-th column of the solution matrix X). + * If XTRUE is the true solution corresponding to X(j), FERR(j) + * is an estimated upper bound for the magnitude of the largest + * element in (X(j) - XTRUE) divided by the magnitude of the + * largest element in X(j). The estimate is as reliable as + * the estimate for RCOND, and is almost always a slight + * overestimate of the true error. + * + * BERR (output) double*, dimension (B->ncol) + * The componentwise relative backward error of each solution + * vector X(j) (i.e., the smallest relative change in + * any element of A or B that makes X(j) an exact solution). + * + * mem_usage (output) mem_usage_t* + * Record the memory usage statistics, consisting of following fields: + * - for_lu (float) + * The amount of space used in bytes for L\U data structures. + * - total_needed (float) + * The amount of space needed in bytes to perform factorization. + * - expansions (int) + * The number of memory expansions during the LU factorization. + * + * info (output) int* + * = 0: successful exit + * < 0: if info = -i, the i-th argument had an illegal value + * > 0: if info = i, and i is + * <= A->ncol: U(i,i) is exactly zero. The factorization has + * been completed, but the factor U is exactly + * singular, so the solution and error bounds + * could not be computed. + * = A->ncol+1: U is nonsingular, but RCOND is less than machine + * precision, meaning that the matrix is singular to + * working precision. Nevertheless, the solution and + * error bounds are computed because there are a number + * of situations where the computed solution can be more + * accurate than the value of RCOND would suggest. + * > A->ncol+1: number of bytes allocated when memory allocation + * failure occurred, plus A->ncol. + * + */ + + DNformat *Bstore, *Xstore; + doublecomplex *Bmat, *Xmat; + int ldb, ldx, nrhs; + SuperMatrix *AA; /* A in NC format used by the factorization routine.*/ + SuperMatrix AC; /* Matrix postmultiplied by Pc */ + int colequ, equil, nofact, notran, rowequ; + char trant[1], norm[1]; + int i, j, info1; + double amax, anorm, bignum, smlnum, colcnd, rowcnd, rcmax, rcmin; + int relax, panel_size; + double diag_pivot_thresh, drop_tol; + double t0; /* temporary time */ + double *utime; + extern SuperLUStat_t SuperLUStat; + + /* External functions */ + extern double zlangs(char *, SuperMatrix *); + extern double dlamch_(char *); + + Bstore = B->Store; + Xstore = X->Store; + Bmat = Bstore->nzval; + Xmat = Xstore->nzval; + ldb = Bstore->lda; + ldx = Xstore->lda; + nrhs = B->ncol; + +#if 0 +printf("zgssvx: fact=%c, trans=%c, refact=%c, equed=%c\n", + *fact, *trans, *refact, *equed); +#endif + + *info = 0; + nofact = lsame_(fact, "N"); + equil = lsame_(fact, "E"); + notran = lsame_(trans, "N"); + if (nofact || equil) { + *(unsigned char *)equed = 'N'; + rowequ = FALSE; + colequ = FALSE; + } else { + rowequ = lsame_(equed, "R") || lsame_(equed, "B"); + colequ = lsame_(equed, "C") || lsame_(equed, "B"); + smlnum = dlamch_("Safe minimum"); + bignum = 1. / smlnum; + } + + /* Test the input parameters */ + if (!nofact && !equil && !lsame_(fact, "F")) *info = -1; + else if (!notran && !lsame_(trans, "T") && !lsame_(trans, "C")) *info = -2; + else if ( !(lsame_(refact,"Y") || lsame_(refact, "N")) ) *info = -3; + else if ( A->nrow != A->ncol || A->nrow < 0 || + (A->Stype != NC && A->Stype != NR) || + A->Dtype != _Z || A->Mtype != GE ) + *info = -4; + else if (lsame_(fact, "F") && !(rowequ || colequ || lsame_(equed, "N"))) + *info = -9; + else { + if (rowequ) { + rcmin = bignum; + rcmax = 0.; + for (j = 0; j < A->nrow; ++j) { + rcmin = MIN(rcmin, R[j]); + rcmax = MAX(rcmax, R[j]); + } + if (rcmin <= 0.) *info = -10; + else if ( A->nrow > 0) + rowcnd = MAX(rcmin,smlnum) / MIN(rcmax,bignum); + else rowcnd = 1.; + } + if (colequ && *info == 0) { + rcmin = bignum; + rcmax = 0.; + for (j = 0; j < A->nrow; ++j) { + rcmin = MIN(rcmin, C[j]); + rcmax = MAX(rcmax, C[j]); + } + if (rcmin <= 0.) *info = -11; + else if (A->nrow > 0) + colcnd = MAX(rcmin,smlnum) / MIN(rcmax,bignum); + else colcnd = 1.; + } + if (*info == 0) { + if ( lwork < -1 ) *info = -15; + else if ( B->ncol < 0 || Bstore->lda < MAX(0, A->nrow) || + B->Stype != DN || B->Dtype != _Z || + B->Mtype != GE ) + *info = -16; + else if ( X->ncol < 0 || Xstore->lda < MAX(0, A->nrow) || + B->ncol != X->ncol || X->Stype != DN || + X->Dtype != _Z || X->Mtype != GE ) + *info = -17; + } + } + if (*info != 0) { + i = -(*info); + xerbla_("zgssvx", &i); + return; + } + + /* Default values for factor_params */ + panel_size = sp_ienv(1); + relax = sp_ienv(2); + diag_pivot_thresh = 1.0; + drop_tol = 0.0; + if ( factor_params != NULL ) { + if ( factor_params->panel_size != -1 ) + panel_size = factor_params->panel_size; + if ( factor_params->relax != -1 ) relax = factor_params->relax; + if ( factor_params->diag_pivot_thresh != -1 ) + diag_pivot_thresh = factor_params->diag_pivot_thresh; + if ( factor_params->drop_tol != -1 ) + drop_tol = factor_params->drop_tol; + } + + StatInit(panel_size, relax); + utime = SuperLUStat.utime; + + /* Convert A to NC format when necessary. */ + if ( A->Stype == NR ) { + NRformat *Astore = A->Store; + AA = (SuperMatrix *) SUPERLU_MALLOC( sizeof(SuperMatrix) ); + zCreate_CompCol_Matrix(AA, A->ncol, A->nrow, Astore->nnz, + Astore->nzval, Astore->colind, Astore->rowptr, + NC, A->Dtype, A->Mtype); + if ( notran ) { /* Reverse the transpose argument. */ + *trant = 'T'; + notran = 0; + } else { + *trant = 'N'; + notran = 1; + } + } else { /* A->Stype == NC */ + *trant = *trans; + AA = A; + } + + if ( equil ) { + t0 = SuperLU_timer_(); + /* Compute row and column scalings to equilibrate the matrix A. */ + zgsequ(AA, R, C, &rowcnd, &colcnd, &amax, &info1); + + if ( info1 == 0 ) { + /* Equilibrate matrix A. */ + zlaqgs(AA, R, C, rowcnd, colcnd, amax, equed); + rowequ = lsame_(equed, "R") || lsame_(equed, "B"); + colequ = lsame_(equed, "C") || lsame_(equed, "B"); + } + utime[EQUIL] = SuperLU_timer_() - t0; + } + + /* Scale the right hand side if equilibration was performed. */ + if ( notran ) { + if ( rowequ ) { + for (j = 0; j < nrhs; ++j) + for (i = 0; i < A->nrow; ++i) { + zd_mult(&Bmat[i + j*ldb], &Bmat[i + j*ldb], R[i]); + } + } + } else if ( colequ ) { + for (j = 0; j < nrhs; ++j) + for (i = 0; i < A->nrow; ++i) { + zd_mult(&Bmat[i + j*ldb], &Bmat[i + j*ldb], C[i]); + } + } + + if ( nofact || equil ) { + + t0 = SuperLU_timer_(); + sp_preorder(refact, AA, perm_c, etree, &AC); + utime[ETREE] = SuperLU_timer_() - t0; + +/* printf("Factor PA = LU ... relax %d\tw %d\tmaxsuper %d\trowblk %d\n", + relax, panel_size, sp_ienv(3), sp_ienv(4)); + fflush(stdout); */ + + /* Compute the LU factorization of A*Pc. */ + t0 = SuperLU_timer_(); + zgstrf(refact, &AC, diag_pivot_thresh, drop_tol, relax, panel_size, + etree, work, lwork, perm_r, perm_c, L, U, info); + utime[FACT] = SuperLU_timer_() - t0; + + if ( lwork == -1 ) { + mem_usage->total_needed = *info - A->ncol; + return; + } + } + + if ( *info > 0 ) { + if ( *info <= A->ncol ) { + /* Compute the reciprocal pivot growth factor of the leading + rank-deficient *info columns of A. */ + *recip_pivot_growth = zPivotGrowth(*info, AA, perm_c, L, U); + } + return; + } + + /* Compute the reciprocal pivot growth factor *recip_pivot_growth. */ + *recip_pivot_growth = zPivotGrowth(A->ncol, AA, perm_c, L, U); + + /* Estimate the reciprocal of the condition number of A. */ + t0 = SuperLU_timer_(); + if ( notran ) { + *(unsigned char *)norm = '1'; + } else { + *(unsigned char *)norm = 'I'; + } + anorm = zlangs(norm, AA); + zgscon(norm, L, U, anorm, rcond, info); + utime[RCOND] = SuperLU_timer_() - t0; + + /* Compute the solution matrix X. */ + for (j = 0; j < nrhs; j++) /* Save a copy of the right hand sides */ + for (i = 0; i < B->nrow; i++) + Xmat[i + j*ldx] = Bmat[i + j*ldb]; + + t0 = SuperLU_timer_(); + zgstrs (trant, L, U, perm_r, perm_c, X, info); + utime[SOLVE] = SuperLU_timer_() - t0; + + /* Use iterative refinement to improve the computed solution and compute + error bounds and backward error estimates for it. */ + t0 = SuperLU_timer_(); + zgsrfs(trant, AA, L, U, perm_r, perm_c, equed, R, C, B, + X, ferr, berr, info); + utime[REFINE] = SuperLU_timer_() - t0; + + /* Transform the solution matrix X to a solution of the original system. */ + if ( notran ) { + if ( colequ ) { + for (j = 0; j < nrhs; ++j) + for (i = 0; i < A->nrow; ++i) { + zd_mult(&Xmat[i + j*ldx], &Xmat[i + j*ldx], C[i]); + } + } + } else if ( rowequ ) { + for (j = 0; j < nrhs; ++j) + for (i = 0; i < A->nrow; ++i) { + zd_mult(&Xmat[i+ j*ldx], &Xmat[i+ j*ldx], R[i]); + } + } + + /* Set INFO = A->ncol+1 if the matrix is singular to working precision. */ + if ( *rcond < dlamch_("E") ) *info = A->ncol + 1; + + zQuerySpace(L, U, panel_size, mem_usage); + + if ( nofact || equil ) Destroy_CompCol_Permuted(&AC); + if ( A->Stype == NR ) { + Destroy_SuperMatrix_Store(AA); + SUPERLU_FREE(AA); + } + + PrintStat( &SuperLUStat ); + StatFree(); +}