/* solveT.c */ #include "../SubMtx.h" #define MYDEBUG 0 /*--------------------------------------------------------------------*/ static void real_solveDenseSubrows ( SubMtx *mtxA, SubMtx *mtxB ) ; static void real_solveDenseSubcolumns ( SubMtx *mtxA, SubMtx *mtxB ) ; static void real_solveSparseRows ( SubMtx *mtxA, SubMtx *mtxB ) ; static void real_solveSparseColumns ( SubMtx *mtxA, SubMtx *mtxB ) ; static void complex_solveDenseSubrows ( SubMtx *mtxA, SubMtx *mtxB ) ; static void complex_solveDenseSubcolumns ( SubMtx *mtxA, SubMtx *mtxB ); static void complex_solveSparseRows ( SubMtx *mtxA, SubMtx *mtxB ) ; static void complex_solveSparseColumns ( SubMtx *mtxA, SubMtx *mtxB ) ; /*--------------------------------------------------------------------*/ /* ----------------------------------------------------------------- purpose -- solve (A^T + I) X = B, where (1) X overwrites B (2) A must be strict lower or upper triangular (3) columns(A) = rows(X) (4) rows(A) = rows(B) (5) B has type SUBMTX_DENSE_COLUMNS (6) if A is SUBMTX_DENSE_SUBROWS or SUBMTX_SPARSE_ROWS then A must be strict lower triangular (7) if A is SUBMTX_DENSE_SUBCOLUMNS or SUBMTX_SPARSE_COLUMNS then A must be strict upper triangular created -- 98may01, cca ----------------------------------------------------------------- */ void SubMtx_solveT ( SubMtx *mtxA, SubMtx *mtxB ) { /* --------------- check the input --------------- */ if ( mtxA == NULL || mtxB == NULL ) { fprintf(stderr, "\n fatal error in SubMtx_solveT(%p,%p)" "\n bad input\n", mtxA, mtxB) ; exit(-1) ; } if ( ! SUBMTX_IS_DENSE_COLUMNS(mtxB) ) { fprintf(stderr, "\n fatal error in SubMtx_solveT(%p,%p)" "\n mtxB has bad type %d\n", mtxA, mtxB, mtxB->type) ; exit(-1) ; } if ( mtxA->nrow != mtxB->nrow ) { fprintf(stderr, "\n fatal error in SubMtx_solveT(%p,%p)" "\n mtxA->nrow = %d, mtxB->nrwo = %d\n", mtxA, mtxB, mtxA->nrow, mtxB->nrow) ; exit(-1) ; } /* ------------------------- switch over the type of A ------------------------- */ switch ( mtxA->type ) { case SPOOLES_REAL : /* ------------------------- switch over the mode of A ------------------------- */ switch ( mtxA->mode ) { case SUBMTX_DENSE_SUBROWS : real_solveDenseSubrows(mtxA, mtxB) ; break ; case SUBMTX_SPARSE_ROWS : real_solveSparseRows(mtxA, mtxB) ; break ; case SUBMTX_DENSE_SUBCOLUMNS : real_solveDenseSubcolumns(mtxA, mtxB) ; break ; case SUBMTX_SPARSE_COLUMNS : real_solveSparseColumns(mtxA, mtxB) ; break ; default : fprintf(stderr, "\n fatal error in SubMtx_solveT(%p,%p)" "\n bad mode %d\n", mtxA, mtxB, mtxA->mode) ; exit(-1) ; break ; } break ; case SPOOLES_COMPLEX : /* ------------------------- switch over the mode of A ------------------------- */ switch ( mtxA->mode ) { case SUBMTX_DENSE_SUBROWS : complex_solveDenseSubrows(mtxA, mtxB) ; break ; case SUBMTX_SPARSE_ROWS : complex_solveSparseRows(mtxA, mtxB) ; break ; case SUBMTX_DENSE_SUBCOLUMNS : complex_solveDenseSubcolumns(mtxA, mtxB) ; break ; case SUBMTX_SPARSE_COLUMNS : complex_solveSparseColumns(mtxA, mtxB) ; break ; default : fprintf(stderr, "\n fatal error in SubMtx_solveT(%p,%p)" "\n bad mode %d\n", mtxA, mtxB, mtxA->mode) ; exit(-1) ; break ; } break ; default : fprintf(stderr, "\n fatal error in SubMtx_solveT(%p,%p)" "\n bad type %d\n", mtxA, mtxB, mtxA->type) ; exit(-1) ; break ; } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (A^T + I) X = B, where (1) A is strictly upper triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98feb19, cca --------------------------------------- */ static void real_solveDenseSubcolumns ( SubMtx *mtxA, SubMtx *mtxB ) { double Aki, sum0, sum1, sum2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int first, ii, inc1, inc2, irowA, jcolB, kk, last, ncolB, nentA, nrowA, nrowB ; int *firstlocsA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_denseSubcolumnsInfo(mtxA, &nrowA, &nentA, &firstlocsA, &sizesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; #if MYDEBUG > 0 fprintf(stdout, "\n nentA = %d", nentA) ; fflush(stdout) ; #endif colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + nrowB ; colB2 = colB1 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n %% jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% irowA %d, size %d", irowA, sizesA[irowA]) ; fflush(stdout) ; #endif if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; #if MYDEBUG > 0 fprintf(stdout, ", first %d, last %d", first, last) ; fflush(stdout) ; #endif sum0 = sum1 = sum2 = 0.0 ; for ( ii = first ; ii <= last ; ii++, kk++ ) { Aki = entriesA[kk] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% Aki A(%d,%d) = %12.4e", irowA+1, ii+1, Aki) ; fflush(stdout) ; #endif sum0 += Aki * colB0[ii] ; sum1 += Aki * colB1[ii] ; sum2 += Aki * colB2[ii] ; } colB0[irowA] -= sum0 ; colB1[irowA] -= sum1 ; colB2[irowA] -= sum2 ; } } #if MYDEBUG > 0 fprintf(stdout, "\n %% kk = %d", kk) ; fflush(stdout) ; #endif colB0 = colB2 + nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n %% jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; sum0 = sum1 = 0.0 ; for ( ii = first ; ii <= last ; ii++, kk++ ) { Aki = entriesA[kk] ; sum0 += Aki * colB0[ii] ; sum1 += Aki * colB1[ii] ; } colB0[irowA] -= sum0 ; colB1[irowA] -= sum1 ; } } } else if ( jcolB == ncolB - 1 ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% irowA = %d, kk = %d, sizesA[%d] = %d", irowA, kk, irowA, sizesA[irowA]) ; fflush(stdout) ; #endif if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; #if MYDEBUG > 0 fprintf(stdout, "\n %% first = %d, last = %d", first, last) ; fflush(stdout) ; #endif sum0 = 0.0 ; for ( ii = first ; ii <= last ; ii++, kk++ ) { Aki = entriesA[kk] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% Aki = %12.4e, colB0[%d] = %12.4e", Aki, ii, colB0[ii]) ; fflush(stdout) ; #endif sum0 += Aki * colB0[ii] ; } colB0[irowA] -= sum0 ; #if MYDEBUG > 0 fprintf(stdout, "\n %% colB0[%d] -= %12.4e", irowA, sum0) ; fflush(stdout) ; #endif } } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (A^T + I) X = B, where (1) A is strictly upper triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98feb19, cca --------------------------------------- */ static void real_solveSparseColumns ( SubMtx *mtxA, SubMtx *mtxB ) { double Aki, sum0, sum1, sum2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int ii, inc1, inc2, irowA, jcolB, jj, kk, ncolB, nentA, nrowA, nrowB, size ; int *indicesA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_sparseColumnsInfo(mtxA, &nrowA, &nentA, &sizesA, &indicesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + nrowB ; colB2 = colB1 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( (size = sizesA[irowA]) > 0 ) { sum0 = sum1 = sum2 = 0.0 ; for ( ii = 0 ; ii < size ; ii++, kk++ ) { Aki = entriesA[kk] ; jj = indicesA[kk] ; if ( jj < 0 || jj >= irowA ) { fprintf(stderr, "\n fatal error, irowA = %d, kk =%d, ii = %d, jj = %d", irowA, kk, ii, jj) ; exit(-1) ; } sum0 += Aki * colB0[jj] ; sum1 += Aki * colB1[jj] ; sum2 += Aki * colB2[jj] ; } colB0[irowA] -= sum0 ; colB1[irowA] -= sum1 ; colB2[irowA] -= sum2 ; } } colB0 = colB2 + nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( (size = sizesA[irowA]) > 0 ) { sum0 = sum1 = 0.0 ; for ( ii = 0 ; ii < size ; ii++, kk++ ) { Aki = entriesA[kk] ; jj = indicesA[kk] ; sum0 += Aki * colB0[jj] ; sum1 += Aki * colB1[jj] ; } colB0[irowA] -= sum0 ; colB1[irowA] -= sum1 ; } } } else if ( jcolB == ncolB - 1 ) { #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( (size = sizesA[irowA]) >= 0 ) { sum0 = 0.0 ; for ( ii = 0 ; ii < size ; ii++, kk++ ) { Aki = entriesA[kk] ; jj = indicesA[kk] ; if ( jj < 0 || jj >= irowA ) { fprintf(stderr, "\n fatal error, irowA = %d, kk =%d, ii = %d, jj = %d", irowA, kk, ii, jj) ; exit(-1) ; } sum0 += Aki * colB0[jj] ; } colB0[irowA] -= sum0 ; } } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (I + A^T) X = B, where (1) A is strictly lower triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98feb19, cca --------------------------------------- */ static void real_solveDenseSubrows ( SubMtx *mtxA, SubMtx *mtxB ) { double Aji, Bi0, Bi1, Bi2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int colstart, first, inc1, inc2, irowA, jcolB, jj, kk, last, ncolB, nentA, nrowA, nrowB ; int *firstlocsA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_denseSubrowsInfo(mtxA, &nrowA, &nentA, &firstlocsA, &sizesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; #if MYDEBUG > 0 fprintf(stdout, "\n nrowA = %d, ncolA = %d", nrowA, nentA) ; fflush(stdout) ; #endif colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + nrowB ; colB2 = colB1 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = nrowA - 1, colstart = nentA ; irowA >= 0 ; irowA-- ) { if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; colstart -= last - first + 1 ; Bi0 = colB0[irowA] ; Bi1 = colB1[irowA] ; Bi2 = colB2[irowA] ; for ( jj = first, kk = colstart ; jj <= last ; jj++, kk++ ) { Aji = entriesA[kk] ; colB0[jj] -= Aji * Bi0 ; colB1[jj] -= Aji * Bi1 ; colB2[jj] -= Aji * Bi2 ; } } } colB0 = colB2 + nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = nrowA - 1, colstart = nentA ; irowA >= 0 ; irowA-- ) { if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; colstart -= last - first + 1 ; Bi0 = colB0[irowA] ; Bi1 = colB1[irowA] ; for ( jj = first, kk = colstart ; jj <= last ; jj++, kk++ ) { Aji = entriesA[kk] ; colB0[jj] -= Aji * Bi0 ; colB1[jj] -= Aji * Bi1 ; } } } } else if ( jcolB == ncolB - 1 ) { #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = nrowA - 1, colstart = nentA ; irowA >= 0 ; irowA-- ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% irowA = %d, sizesA[%d] = %d", irowA, irowA, sizesA[irowA]) ; fflush(stdout) ; #endif if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; colstart -= last - first + 1 ; Bi0 = colB0[irowA] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% first %d, last %d, colstart %d, Bi0 = %12.4e", first, last, colstart, Bi0) ; fflush(stdout) ; #endif for ( jj = first, kk = colstart ; jj <= last ; jj++, kk++ ) { Aji = entriesA[kk] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% jj %d, kk %d, Aji %12.4e", jj, kk, Aji) ; fflush(stdout) ; #endif colB0[jj] -= Aji * Bi0 ; } } } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (I + A^T) X = B, where (1) A is strictly lower triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98feb19, cca --------------------------------------- */ static void real_solveSparseRows ( SubMtx *mtxA, SubMtx *mtxB ) { double Aji, Bi0, Bi1, Bi2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int colstart, ii, inc1, inc2, jcolA, jcolB, jj, kk, ncolB, nentA, nrowA, nrowB, size ; int *indicesA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_sparseRowsInfo(mtxA, &nrowA, &nentA, &sizesA, &indicesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; #if MYDEBUG > 0 fprintf(stdout, "\n nrowA = %d, ncolA = %d", nrowA, nentA) ; fflush(stdout) ; #endif colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + nrowB ; colB2 = colB1 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( jcolA = nrowA - 1, colstart = nentA ; jcolA >= 0 ; jcolA-- ) { if ( (size = sizesA[jcolA]) > 0 ) { colstart -= size ; Bi0 = colB0[jcolA] ; Bi1 = colB1[jcolA] ; Bi2 = colB2[jcolA] ; for ( ii = 0, kk = colstart ; ii < size ; ii++, kk++ ) { Aji = entriesA[kk] ; jj = indicesA[kk] ; colB0[jj] -= Aji * Bi0 ; colB1[jj] -= Aji * Bi1 ; colB2[jj] -= Aji * Bi2 ; } } } colB0 = colB2 + nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( jcolA = nrowA - 1, colstart = nentA ; jcolA >= 0 ; jcolA-- ) { if ( (size = sizesA[jcolA]) > 0 ) { colstart -= size ; Bi0 = colB0[jcolA] ; Bi1 = colB1[jcolA] ; for ( ii = 0, kk = colstart ; ii < size ; ii++, kk++ ) { Aji = entriesA[kk] ; jj = indicesA[kk] ; colB0[jj] -= Aji * Bi0 ; colB1[jj] -= Aji * Bi1 ; } } } } else if ( jcolB == ncolB - 1 ) { #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( jcolA = nrowA - 1, colstart = nentA ; jcolA >= 0 ; jcolA-- ) { if ( (size = sizesA[jcolA]) > 0 ) { colstart -= size ; Bi0 = colB0[jcolA] ; for ( ii = 0, kk = colstart ; ii < size ; ii++, kk++ ) { Aji = entriesA[kk] ; jj = indicesA[kk] ; colB0[jj] -= Aji * Bi0 ; } } } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (A^T + I) X = B, where (1) A is strictly upper triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98may01, cca --------------------------------------- */ static void complex_solveDenseSubcolumns ( SubMtx *mtxA, SubMtx *mtxB ) { double ai, ar, bi0, bi1, bi2, br0, br1, br2, isum0, isum1, isum2, rsum0, rsum1, rsum2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int first, ii, iloc, inc1, inc2, irowA, jcolB, kk, last, ncolB, nentA, nrowA, nrowB, rloc ; int *firstlocsA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_denseSubcolumnsInfo(mtxA, &nrowA, &nentA, &firstlocsA, &sizesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; #if MYDEBUG > 0 fprintf(stdout, "\n nentA = %d", nentA) ; fflush(stdout) ; #endif colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + 2*nrowB ; colB2 = colB1 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n %% jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% irowA %d, size %d", irowA, sizesA[irowA]) ; fflush(stdout) ; #endif if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; #if MYDEBUG > 0 fprintf(stdout, ", first %d, last %d", first, last) ; fflush(stdout) ; #endif rsum0 = isum0 = 0.0 ; rsum1 = isum1 = 0.0 ; rsum2 = isum2 = 0.0 ; for ( ii = first ; ii <= last ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% A(%d,%d) = (%12.4e,%12.4e)", irowA+1, ii+1, ar, ai) ; fflush(stdout) ; #endif rloc = 2*ii ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; br2 = colB2[rloc] ; bi2 = colB2[iloc] ; rsum0 += ar*br0 - ai*bi0 ; isum0 += ar*bi0 + ai*br0 ; rsum1 += ar*br1 - ai*bi1 ; isum1 += ar*bi1 + ai*br1 ; rsum2 += ar*br2 - ai*bi2 ; isum2 += ar*bi2 + ai*br2 ; } rloc = 2*irowA ; iloc = rloc + 1 ; colB0[rloc] -= rsum0 ; colB0[iloc] -= isum0 ; colB1[rloc] -= rsum1 ; colB1[iloc] -= isum1 ; colB2[rloc] -= rsum2 ; colB2[iloc] -= isum2 ; } } #if MYDEBUG > 0 fprintf(stdout, "\n %% kk = %d", kk) ; fflush(stdout) ; #endif colB0 = colB2 + 2*nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + 2*nrowB ; for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% irowA %d, size %d", irowA, sizesA[irowA]) ; fflush(stdout) ; #endif if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; #if MYDEBUG > 0 fprintf(stdout, ", first %d, last %d", first, last) ; fflush(stdout) ; #endif rsum0 = isum0 = 0.0 ; rsum1 = isum1 = 0.0 ; for ( ii = first ; ii <= last ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% A(%d,%d) = (%12.4e,%12.4e)", irowA+1, ii+1, ar, ai) ; fflush(stdout) ; #endif rloc = 2*ii ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; rsum0 += ar*br0 - ai*bi0 ; isum0 += ar*bi0 + ai*br0 ; rsum1 += ar*br1 - ai*bi1 ; isum1 += ar*bi1 + ai*br1 ; } rloc = 2*irowA ; iloc = rloc + 1 ; colB0[rloc] -= rsum0 ; colB0[iloc] -= isum0 ; colB1[rloc] -= rsum1 ; colB1[iloc] -= isum1 ; } #if MYDEBUG > 0 fprintf(stdout, "\n %% kk = %d", kk) ; fflush(stdout) ; #endif } } else if ( jcolB == ncolB - 1 ) { for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { #if MYDEBUG > 0 fprintf(stdout, "\n %% irowA %d, size %d", irowA, sizesA[irowA]) ; fflush(stdout) ; #endif if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; #if MYDEBUG > 0 fprintf(stdout, ", first %d, last %d", first, last) ; fflush(stdout) ; #endif rsum0 = isum0 = 0.0 ; for ( ii = first ; ii <= last ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; #if MYDEBUG > 0 fprintf(stdout, "\n %% A(%d,%d) = (%12.4e,%12.4e)", irowA+1, ii+1, ar, ai) ; fflush(stdout) ; #endif rloc = 2*ii ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; rsum0 += ar*br0 - ai*bi0 ; isum0 += ar*bi0 + ai*br0 ; } rloc = 2*irowA ; iloc = rloc + 1 ; colB0[rloc] -= rsum0 ; colB0[iloc] -= isum0 ; } #if MYDEBUG > 0 fprintf(stdout, "\n %% kk = %d", kk) ; fflush(stdout) ; #endif } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (A^T + I) X = B, where (1) A is strictly upper triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98may01, cca --------------------------------------- */ static void complex_solveSparseColumns ( SubMtx *mtxA, SubMtx *mtxB ) { double ai, ar, bi0, bi1, bi2, br0, br1, br2, isum0, isum1, isum2, rsum0, rsum1, rsum2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int ii, iloc, inc1, inc2, irowA, jcolB, jj, kk, ncolB, nentA, nrowA, nrowB, rloc, size ; int *indicesA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_sparseColumnsInfo(mtxA, &nrowA, &nentA, &sizesA, &indicesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + 2*nrowB ; colB2 = colB1 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( (size = sizesA[irowA]) > 0 ) { rsum0 = isum0 = 0.0 ; rsum1 = isum1 = 0.0 ; rsum2 = isum2 = 0.0 ; for ( ii = 0 ; ii < size ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; jj = indicesA[kk] ; if ( jj < 0 || jj >= irowA ) { fprintf(stderr, "\n fatal error, irowA = %d, kk =%d, ii = %d, jj = %d", irowA, kk, ii, jj) ; exit(-1) ; } rloc = 2*jj ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; br2 = colB2[rloc] ; bi2 = colB2[iloc] ; rsum0 += ar*br0 - ai*bi0 ; isum0 += ar*bi0 + ai*br0 ; rsum1 += ar*br1 - ai*bi1 ; isum1 += ar*bi1 + ai*br1 ; rsum2 += ar*br2 - ai*bi2 ; isum2 += ar*bi2 + ai*br2 ; } rloc = 2*irowA ; iloc = rloc + 1 ; colB0[rloc] -= rsum0 ; colB0[iloc] -= isum0 ; colB1[rloc] -= rsum1 ; colB1[iloc] -= isum1 ; colB2[rloc] -= rsum2 ; colB2[iloc] -= isum2 ; } } colB0 = colB2 + 2*nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( (size = sizesA[irowA]) > 0 ) { rsum0 = isum0 = 0.0 ; rsum1 = isum1 = 0.0 ; for ( ii = 0 ; ii < size ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; jj = indicesA[kk] ; if ( jj < 0 || jj >= irowA ) { fprintf(stderr, "\n fatal error, irowA = %d, kk =%d, ii = %d, jj = %d", irowA, kk, ii, jj) ; exit(-1) ; } rloc = 2*jj ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; rsum0 += ar*br0 - ai*bi0 ; isum0 += ar*bi0 + ai*br0 ; rsum1 += ar*br1 - ai*bi1 ; isum1 += ar*bi1 + ai*br1 ; } rloc = 2*irowA ; iloc = rloc + 1 ; colB0[rloc] -= rsum0 ; colB0[iloc] -= isum0 ; colB1[rloc] -= rsum1 ; colB1[iloc] -= isum1 ; } } } else if ( jcolB == ncolB - 1 ) { for ( irowA = kk = 0 ; irowA < nrowA ; irowA++ ) { if ( (size = sizesA[irowA]) > 0 ) { rsum0 = isum0 = 0.0 ; for ( ii = 0 ; ii < size ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; jj = indicesA[kk] ; if ( jj < 0 || jj >= irowA ) { fprintf(stderr, "\n fatal error, irowA = %d, kk =%d, ii = %d, jj = %d", irowA, kk, ii, jj) ; exit(-1) ; } rloc = 2*jj ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; rsum0 += ar*br0 - ai*bi0 ; isum0 += ar*bi0 + ai*br0 ; } rloc = 2*irowA ; iloc = rloc + 1 ; colB0[rloc] -= rsum0 ; colB0[iloc] -= isum0 ; } } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (I + A^T) X = B, where (1) A is strictly lower triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98may01, cca --------------------------------------- */ static void complex_solveDenseSubrows ( SubMtx *mtxA, SubMtx *mtxB ) { double ai, ar, bi0, bi1, bi2, br0, br1, br2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int colstart, first, iloc, inc1, inc2, irowA, jcolB, jj, kk, last, ncolB, nentA, nrowA, nrowB, rloc ; int *firstlocsA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_denseSubrowsInfo(mtxA, &nrowA, &nentA, &firstlocsA, &sizesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; #if MYDEBUG > 0 fprintf(stdout, "\n nrowA = %d, ncolA = %d", nrowA, nentA) ; fflush(stdout) ; #endif colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + 2*nrowB ; colB2 = colB1 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = nrowA - 1, colstart = nentA ; irowA >= 0 ; irowA-- ) { if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; colstart -= last - first + 1 ; rloc = 2*irowA ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; br2 = colB2[rloc] ; bi2 = colB2[iloc] ; for ( jj = first, kk = colstart ; jj <= last ; jj++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; rloc = 2*jj ; iloc = rloc + 1 ; colB0[rloc] -= ar*br0 - ai*bi0 ; colB0[iloc] -= ar*bi0 + ai*br0 ; colB1[rloc] -= ar*br1 - ai*bi1 ; colB1[iloc] -= ar*bi1 + ai*br1 ; colB2[rloc] -= ar*br2 - ai*bi2 ; colB2[iloc] -= ar*bi2 + ai*br2 ; } } } colB0 = colB2 + 2*nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = nrowA - 1, colstart = nentA ; irowA >= 0 ; irowA-- ) { if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; colstart -= last - first + 1 ; rloc = 2*irowA ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; for ( jj = first, kk = colstart ; jj <= last ; jj++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; rloc = 2*jj ; iloc = rloc + 1 ; colB0[rloc] -= ar*br0 - ai*bi0 ; colB0[iloc] -= ar*bi0 + ai*br0 ; colB1[rloc] -= ar*br1 - ai*bi1 ; colB1[iloc] -= ar*bi1 + ai*br1 ; } } } } else if ( jcolB == ncolB - 1 ) { #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( irowA = nrowA - 1, colstart = nentA ; irowA >= 0 ; irowA-- ) { if ( sizesA[irowA] > 0 ) { first = firstlocsA[irowA] ; last = first + sizesA[irowA] - 1 ; colstart -= last - first + 1 ; rloc = 2*irowA ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; for ( jj = first, kk = colstart ; jj <= last ; jj++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; rloc = 2*jj ; iloc = rloc + 1 ; colB0[rloc] -= ar*br0 - ai*bi0 ; colB0[iloc] -= ar*bi0 + ai*br0 ; } } } } return ; } /*--------------------------------------------------------------------*/ /* --------------------------------------- purpose -- solve (I + A^T) X = B, where (1) A is strictly lower triangular (2) X overwrites B (B) B has type SUBMTX_DENSE_COLUMNS created -- 98may01, cca --------------------------------------- */ static void complex_solveSparseRows ( SubMtx *mtxA, SubMtx *mtxB ) { double ai, ar, bi0, bi1, bi2, br0, br1, br2 ; double *colB0, *colB1, *colB2, *entriesA, *entriesB ; int colstart, ii, iloc, inc1, inc2, jcolA, jcolB, jj, kk, ncolB, nentA, nrowA, nrowB, rloc, size ; int *indicesA, *sizesA ; /* ---------------------------------------------------- extract the pointer and dimensions from two matrices ---------------------------------------------------- */ SubMtx_sparseRowsInfo(mtxA, &nrowA, &nentA, &sizesA, &indicesA, &entriesA) ; SubMtx_denseInfo(mtxB, &nrowB, &ncolB, &inc1, &inc2, &entriesB) ; #if MYDEBUG > 0 fprintf(stdout, "\n nrowA = %d, ncolA = %d", nrowA, nentA) ; fflush(stdout) ; #endif colB0 = entriesB ; for ( jcolB = 0 ; jcolB < ncolB - 2 ; jcolB += 3 ) { colB1 = colB0 + 2*nrowB ; colB2 = colB1 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( jcolA = nrowA - 1, colstart = nentA ; jcolA >= 0 ; jcolA-- ) { if ( (size = sizesA[jcolA]) > 0 ) { colstart -= size ; rloc = 2*jcolA ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; br2 = colB2[rloc] ; bi2 = colB2[iloc] ; for ( ii = 0, kk = colstart ; ii < size ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; jj = indicesA[kk] ; rloc = 2*jj ; iloc = rloc + 1 ; colB0[rloc] -= ar*br0 - ai*bi0 ; colB0[iloc] -= ar*bi0 + ai*br0 ; colB1[rloc] -= ar*br1 - ai*bi1 ; colB1[iloc] -= ar*bi1 + ai*br1 ; colB2[rloc] -= ar*br2 - ai*bi2 ; colB2[iloc] -= ar*bi2 + ai*br2 ; } } } colB0 = colB2 + 2*nrowB ; } if ( jcolB == ncolB - 2 ) { colB1 = colB0 + 2*nrowB ; #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( jcolA = nrowA - 1, colstart = nentA ; jcolA >= 0 ; jcolA-- ) { if ( (size = sizesA[jcolA]) > 0 ) { colstart -= size ; rloc = 2*jcolA ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; br1 = colB1[rloc] ; bi1 = colB1[iloc] ; for ( ii = 0, kk = colstart ; ii < size ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; jj = indicesA[kk] ; rloc = 2*jj ; iloc = rloc + 1 ; colB0[rloc] -= ar*br0 - ai*bi0 ; colB0[iloc] -= ar*bi0 + ai*br0 ; colB1[rloc] -= ar*br1 - ai*bi1 ; colB1[iloc] -= ar*bi1 + ai*br1 ; } } } } else if ( jcolB == ncolB - 1 ) { #if MYDEBUG > 0 fprintf(stdout, "\n jcolB = %d", jcolB) ; fflush(stdout) ; #endif for ( jcolA = nrowA - 1, colstart = nentA ; jcolA >= 0 ; jcolA-- ) { if ( (size = sizesA[jcolA]) > 0 ) { colstart -= size ; rloc = 2*jcolA ; iloc = rloc + 1 ; br0 = colB0[rloc] ; bi0 = colB0[iloc] ; for ( ii = 0, kk = colstart ; ii < size ; ii++, kk++ ) { ar = entriesA[2*kk] ; ai = entriesA[2*kk+1] ; jj = indicesA[kk] ; rloc = 2*jj ; iloc = rloc + 1 ; colB0[rloc] -= ar*br0 - ai*bi0 ; colB0[iloc] -= ar*bi0 + ai*br0 ; } } } } return ; } /*--------------------------------------------------------------------*/