dgtrfs function
void
dgtrfs(
- String TRANS,
- int N,
- int NRHS,
- Array<
double> DL_, - Array<
double> D_, - Array<
double> DU_, - Array<
double> DLF_, - Array<
double> DF_, - Array<
double> DUF_, - Array<
double> DU2_, - Array<
int> IPIV_, - Matrix<
double> B_, - int LDB,
- Matrix<
double> X_, - int LDX,
- Array<
double> FERR_, - Array<
double> BERR_, - Array<
double> WORK_, - Array<
int> IWORK_, - Box<
int> INFO,
Implementation
void dgtrfs(
final String TRANS,
final int N,
final int NRHS,
final Array<double> DL_,
final Array<double> D_,
final Array<double> DU_,
final Array<double> DLF_,
final Array<double> DF_,
final Array<double> DUF_,
final Array<double> DU2_,
final Array<int> IPIV_,
final Matrix<double> B_,
final int LDB,
final Matrix<double> X_,
final int LDX,
final Array<double> FERR_,
final Array<double> BERR_,
final Array<double> WORK_,
final Array<int> IWORK_,
final Box<int> INFO,
) {
final DL = DL_.having();
final D = D_.having();
final DU = DU_.having();
final DLF = DLF_.having();
final DF = DF_.having();
final DUF = DUF_.having();
final DU2 = DU2_.having();
final IPIV = IPIV_.having();
final B = B_.having(ld: LDB);
final X = X_.having(ld: LDX);
final FERR = FERR_.having();
final BERR = BERR_.having();
final WORK = WORK_.having();
final IWORK = IWORK_.having();
const ITMAX = 5;
const ZERO = 0.0, ONE = 1.0;
const TWO = 2.0;
const THREE = 3.0;
bool NOTRAN;
String TRANSN, TRANST;
int COUNT, I, J, NZ;
double EPS, LSTRES, S, SAFE1, SAFE2, SAFMIN;
final ISAVE = Array<int>(3);
final KASE = Box(0);
// Test the input parameters.
INFO.value = 0;
NOTRAN = lsame(TRANS, 'N');
if (!NOTRAN && !lsame(TRANS, 'T') && !lsame(TRANS, 'C')) {
INFO.value = -1;
} else if (N < 0) {
INFO.value = -2;
} else if (NRHS < 0) {
INFO.value = -3;
} else if (LDB < max(1, N)) {
INFO.value = -13;
} else if (LDX < max(1, N)) {
INFO.value = -15;
}
if (INFO.value != 0) {
xerbla('DGTRFS', -INFO.value);
return;
}
// Quick return if possible
if (N == 0 || NRHS == 0) {
for (J = 1; J <= NRHS; J++) {
FERR[J] = ZERO;
BERR[J] = ZERO;
}
return;
}
if (NOTRAN) {
TRANSN = 'N';
TRANST = 'T';
} else {
TRANSN = 'T';
TRANST = 'N';
}
// NZ = maximum number of nonzero elements in each row of A, plus 1
NZ = 4;
EPS = dlamch('Epsilon');
SAFMIN = dlamch('Safe minimum');
SAFE1 = NZ * SAFMIN;
SAFE2 = SAFE1 / EPS;
// Do for each right hand side
for (J = 1; J <= NRHS; J++) {
COUNT = 1;
LSTRES = THREE;
while (true) {
// Loop until stopping criterion is satisfied.
// Compute residual R = B - op(A) * X,
// where op(A) = A, A**T, or A**H, depending on TRANS.
dcopy(N, B(1, J).asArray(), 1, WORK(N + 1), 1);
dlagtm(TRANS, N, 1, -ONE, DL, D, DU, X(1, J), LDX, ONE,
WORK(N + 1).asMatrix(N), N);
// Compute abs(op(A))*abs(x) + abs(b) for use in the backward
// error bound.
if (NOTRAN) {
if (N == 1) {
WORK[1] = B[1][J].abs() + (D[1] * X[1][J]).abs();
} else {
WORK[1] =
B[1][J].abs() + (D[1] * X[1][J]).abs() + (DU[1] * X[2][J]).abs();
for (I = 2; I <= N - 1; I++) {
WORK[I] = B[I][J].abs() +
(DL[I - 1] * X[I - 1][J]).abs() +
(D[I] * X[I][J]).abs() +
(DU[I] * X[I + 1][J]).abs();
}
WORK[N] = B[N][J].abs() +
(DL[N - 1] * X[N - 1][J]).abs() +
(D[N] * X[N][J]).abs();
}
} else {
if (N == 1) {
WORK[1] = B[1][J].abs() + (D[1] * X[1][J]).abs();
} else {
WORK[1] =
B[1][J].abs() + (D[1] * X[1][J]).abs() + (DL[1] * X[2][J]).abs();
for (I = 2; I <= N - 1; I++) {
WORK[I] = B[I][J].abs() +
(DU[I - 1] * X[I - 1][J]).abs() +
(D[I] * X[I][J]).abs() +
(DL[I] * X[I + 1][J]).abs();
}
WORK[N] = B[N][J].abs() +
(DU[N - 1] * X[N - 1][J]).abs() +
(D[N] * X[N][J]).abs();
}
}
// Compute componentwise relative backward error from formula
// max(i) ( abs(R(i)) / ( abs(op(A))*abs(X) + abs(B) )(i) )
// where abs(Z) is the componentwise absolute value of the matrix
// or vector Z. If the i-th component of the denominator is less
// than SAFE2, then SAFE1 is added to the i-th components of the
// numerator and denominator before dividing.
S = ZERO;
for (I = 1; I <= N; I++) {
if (WORK[I] > SAFE2) {
S = max(S, WORK[N + I].abs() / WORK[I]);
} else {
S = max(S, (WORK[N + I].abs() + SAFE1) / (WORK[I] + SAFE1));
}
}
BERR[J] = S;
// Test stopping criterion. Continue iterating if
// 1) The residual BERR[J] is larger than machine epsilon, and
// 2) BERR[J] decreased by at least a factor of 2 during the
// last iteration, and
// 3) At most ITMAX iterations tried.
if (BERR[J] > EPS && TWO * BERR[J] <= LSTRES && COUNT <= ITMAX) {
// Update solution and try again.
dgttrs(TRANS, N, 1, DLF, DF, DUF, DU2, IPIV, WORK(N + 1).asMatrix(N), N,
INFO);
daxpy(N, ONE, WORK(N + 1), 1, X(1, J).asArray(), 1);
LSTRES = BERR[J];
COUNT++;
continue;
}
break;
}
// Bound error from formula
// norm(X - XTRUE) / norm(X) <= FERR =
// norm( abs(inv(op(A)))*
// ( abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) ))) / norm(X)
// where
// norm(Z) is the magnitude of the largest component of Z
// inv(op(A)) is the inverse of op(A)
// abs(Z) is the componentwise absolute value of the matrix or
// vector Z
// NZ is the maximum number of nonzeros in any row of A, plus 1
// EPS is machine epsilon
// The i-th component of abs(R)+NZ*EPS*(abs(op(A))*abs(X)+abs(B))
// is incremented by SAFE1 if the i-th component of
// abs(op(A))*abs(X) + abs(B) is less than SAFE2.
// Use DLACN2 to estimate the infinity-norm of the matrix
// inv(op(A)) * diag(W),
// where W = abs(R) + NZ*EPS*( abs(op(A))*abs(X)+abs(B) )))
for (I = 1; I <= N; I++) {
if (WORK[I] > SAFE2) {
WORK[I] = WORK[N + I].abs() + NZ * EPS * WORK[I];
} else {
WORK[I] = WORK[N + I].abs() + NZ * EPS * WORK[I] + SAFE1;
}
}
KASE.value = 0;
while (true) {
dlacn2(N, WORK(2 * N + 1), WORK(N + 1), IWORK, FERR.box(J), KASE, ISAVE);
if (KASE.value == 0) break;
if (KASE.value == 1) {
// Multiply by diag(W)*inv(op(A)**T).
dgttrs(TRANST, N, 1, DLF, DF, DUF, DU2, IPIV, WORK(N + 1).asMatrix(N),
N, INFO);
for (I = 1; I <= N; I++) {
WORK[N + I] = WORK[I] * WORK[N + I];
}
} else {
// Multiply by inv(op(A))*diag(W).
for (I = 1; I <= N; I++) {
WORK[N + I] = WORK[I] * WORK[N + I];
}
dgttrs(TRANSN, N, 1, DLF, DF, DUF, DU2, IPIV, WORK(N + 1).asMatrix(N),
N, INFO);
}
}
// Normalize error.
LSTRES = ZERO;
for (I = 1; I <= N; I++) {
LSTRES = max(LSTRES, X[I][J].abs());
}
if (LSTRES != ZERO) FERR[J] /= LSTRES;
}
}