/*********************************************************/
/* TAUCS                                                 */
/* Author: Sivan Toledo                                  */
/*********************************************************/

#include <stdio.h>
#include <stdlib.h>
#include <assert.h>
#include <math.h>
#include "taucs.h"

#ifndef TAUCS_CORE
#error "You must define TAUCS_CORE to compile this file"
#endif

/*********************************************************/
/* split into left, right columns                        */
/*********************************************************/

#ifdef TAUCS_CORE_GENERAL
void 
taucs_ccs_split(taucs_ccs_matrix*  A, 
		taucs_ccs_matrix** L, 
		taucs_ccs_matrix** R, 
		int p)
{

#ifdef TAUCS_DOUBLE_IN_BUILD
  if (A->flags & TAUCS_DOUBLE)
    taucs_dccs_split(A,L,R,p);
#endif

#ifdef TAUCS_SINGLE_IN_BUILD
  if (A->flags & TAUCS_SINGLE)
    taucs_sccs_split(A,L,R,p);
#endif

#ifdef TAUCS_DCOMPLEX_IN_BUILD
  if (A->flags & TAUCS_DCOMPLEX)
    taucs_zccs_split(A,L,R,p);
#endif

#ifdef TAUCS_SCOMPLEX_IN_BUILD
  if (A->flags & TAUCS_SCOMPLEX)
    taucs_cccs_split(A,L,R,p);
#endif
  
  
}
#endif /*TAUCS_CORE_GENERAL*/

#ifndef TAUCS_CORE_GENERAL

/* split into left p columns, right p columns */
void 
taucs_dtl(ccs_split)(taucs_ccs_matrix*  A, 
		     taucs_ccs_matrix** L, 
		     taucs_ccs_matrix** R, 
		     int p)
{
  int i,n;
  int Lnnz, Rnnz;

  assert((A->flags & TAUCS_SYMMETRIC) || (A->flags & TAUCS_TRIANGULAR));
  assert(A->flags & TAUCS_LOWER);

  n = A->n;

  *L = (taucs_ccs_matrix*) taucs_malloc(sizeof(taucs_ccs_matrix));
  *R = (taucs_ccs_matrix*) taucs_malloc(sizeof(taucs_ccs_matrix));
  if (!(*L) || !(*R)) { 
    taucs_printf("taucs_ccs_split: out of memory\n");
    taucs_free(*L);
    taucs_free(*R);
    *L = *R = NULL;
    return; 
  }

  Lnnz = 0;
  for (i=0; i<p; i++)
    Lnnz += ( (A->colptr)[i+1] - (A->colptr)[i] );
    
  (*L)->flags |= TAUCS_SYMMETRIC | TAUCS_LOWER;
  (*L)->n = n;
  (*L)->m = n;
  (*L)->colptr = (int*)    taucs_malloc((n+1) * sizeof(int));
  (*L)->rowind = (int*)    taucs_malloc(Lnnz   * sizeof(int));
  (*L)->taucs_values = (void*)   taucs_malloc(Lnnz   * sizeof(taucs_datatype));
  if (!((*L)->colptr) || !((*L)->rowind) || !((*L)->rowind)) {
    	taucs_printf("taucs_ccs_split: out of memory: n=%d nnz=%d\n",n,Lnnz);
	taucs_free((*L)->colptr); taucs_free((*L)->rowind); taucs_free((*L)->taucs_values);
	taucs_free ((*L));
	return; 
  }

  for (i=0; i<=p; i++)
    ((*L)->colptr)[i] = (A->colptr)[i];   
  for (i=p+1; i<n+1; i++)
    ((*L)->colptr)[i] = ((*L)->colptr)[p]; /* other columns are empty */

  for (i=0; i<Lnnz; i++) {
    ((*L)->rowind)[i] = (A->rowind)[i];
    ((*L)->taucs_values)[i] = (A->taucs_values)[i];
  }

  /* now copy right part of matrix into a p-by-p matrix */

  Rnnz = 0;
  for (i=p; i<n; i++)
    Rnnz += ( (A->colptr)[i+1] - (A->colptr)[i] );
    
  (*R)->flags = TAUCS_SYMMETRIC | TAUCS_LOWER;
  (*R)->n = n-p;
  (*R)->m = n-p;
  (*R)->colptr = (int*)    taucs_malloc((n-p+1) * sizeof(int));
  (*R)->rowind = (int*)    taucs_malloc(Rnnz   * sizeof(int));
  (*R)->taucs_values = (void*)   taucs_malloc(Rnnz   * sizeof(taucs_datatype));
  if (!((*R)->colptr) || !((*R)->rowind) || !((*R)->rowind)) {
    	taucs_printf("taucs_ccs_split: out of memory (3): p=%d nnz=%d\n",p,Rnnz);
	taucs_free((*R)->colptr); taucs_free((*R)->rowind); taucs_free((*R)->taucs_values);
	taucs_free((*L)->colptr); taucs_free((*L)->rowind); taucs_free((*L)->taucs_values);
	taucs_free ((*R));
	taucs_free ((*L));
	return; 
  }
    
  for (i=0; i<=(n-p); i++)
    ((*R)->colptr)[i] = (A->colptr)[i+p] - Lnnz;   

  for (i=0; i<Rnnz; i++) {
    ((*R)->rowind)[i] = (A->rowind)[i + Lnnz] - p;
    ((*R)->taucs_values)[i] = (A->taucs_values)[i + Lnnz];
  }
} 

#endif /*#ifndef TAUCS_CORE_GENERAL*/

/*********************************************************/
/* permute symmetrically                                 */
/*********************************************************/

#ifdef TAUCS_CORE_GENERAL
taucs_ccs_matrix* 
taucs_ccs_permute_symmetrically(taucs_ccs_matrix* A, int* perm, int* invperm)
{

#ifdef TAUCS_DOUBLE_IN_BUILD
  if (A->flags & TAUCS_DOUBLE)
    return taucs_dccs_permute_symmetrically(A,perm,invperm);
#endif

#ifdef TAUCS_SINGLE_IN_BUILD
  if (A->flags & TAUCS_SINGLE)
    return taucs_sccs_permute_symmetrically(A,perm,invperm);
#endif

#ifdef TAUCS_DCOMPLEX_IN_BUILD
  if (A->flags & TAUCS_DCOMPLEX)
    return taucs_zccs_permute_symmetrically(A,perm,invperm);
#endif

#ifdef TAUCS_SCOMPLEX_IN_BUILD
  if (A->flags & TAUCS_SCOMPLEX)
    return taucs_cccs_permute_symmetrically(A,perm,invperm);
#endif
  
  assert(0);
  return NULL;
}
#endif /*TAUCS_CORE_GENERAL*/

#ifndef TAUCS_CORE_GENERAL

taucs_ccs_matrix* 
taucs_dtl(ccs_permute_symmetrically)(taucs_ccs_matrix* A, int* perm, int* invperm)
{
  taucs_ccs_matrix* PAPT;
  int n;
  int nnz;
  /*int* colptr;*/
  int* len;
  int i,j,ip,I,J;
  taucs_datatype AIJ;

  assert(A->flags & TAUCS_SYMMETRIC || A->flags & TAUCS_HERMITIAN);
  assert(A->flags & TAUCS_LOWER);

  n   = A->n;
  nnz = (A->colptr)[n];

  PAPT = taucs_dtl(ccs_create)(n,n,nnz);
  if (!PAPT) return NULL;

  /*PAPT->flags = TAUCS_SYMMETRIC | TAUCS_LOWER;*/
  PAPT->flags = A->flags;

  len    = (int*) taucs_malloc(n * sizeof(int));
  /*colptr = (int*) taucs_malloc(n * sizeof(int));*/
  if (!len) {
    taucs_printf("taucs_ccs_permute_symmetrically: out of memory\n");
    taucs_ccs_free(PAPT);
    return NULL;
  }

  for (j=0; j<n; j++) len[j] = 0;

  for (j=0; j<n; j++) {
    for (ip = (A->colptr)[j]; ip < (A->colptr)[j+1]; ip++) {
      /*i = (A->rowind)[ip] - (A->indshift);*/
      i = (A->rowind)[ip];

      I = invperm[i];
      J = invperm[j];

      if (I < J) {
	int T = I; 
	I = J;
	J = T;
      }

      len[J] ++;
      
    }
  }

  (PAPT->colptr)[0] = 0;
  for (j=1; j<=n; j++) (PAPT->colptr)[j] = (PAPT->colptr)[j-1] + len[j-1];

  for (j=0; j<n; j++) len[j] = (PAPT->colptr)[j];
  
  for (j=0; j<n; j++) {
    for (ip = (A->colptr)[j]; ip < (A->colptr)[j+1]; ip++) {
      /*i   = (A->rowind)[ip] - (A->indshift);*/
      i   = (A->rowind)[ip];
      AIJ = (A->taucs_values)[ip];

      I = invperm[i];
      J = invperm[j];

      if (I < J) {
	int T = I; 
	I = J;
	J = T;
	if (A->flags & TAUCS_HERMITIAN) AIJ = taucs_conj(AIJ);
      }

      /*(PAPT->rowind)[ len[J] ] = I + (PAPT->indshift);*/
      (PAPT->rowind)[ len[J] ] = I;
      (PAPT->taucs_values)[ len[J] ] = AIJ;

      len[J] ++;
    }
  }

  taucs_free(len);
  return PAPT;
}

#endif /*#ifndef TAUCS_CORE_GENERAL*/

/*********************************************************/
/* compute B = A*X                                       */
/* current restrictions: A must be square, real          */
/*********************************************************/

#ifdef TAUCS_CORE_GENERAL
void 
taucs_ccs_times_vec(taucs_ccs_matrix* m, 
		    void* X,
		    void* B)
{

#ifdef TAUCS_DOUBLE_IN_BUILD
  if (m->flags & TAUCS_DOUBLE)
    taucs_dccs_times_vec(m, (taucs_double*) X, (taucs_double*) B);
#endif

#ifdef TAUCS_SINGLE_IN_BUILD
  if (m->flags & TAUCS_SINGLE)
    taucs_sccs_times_vec(m, (taucs_single*) X, (taucs_single*) B);
#endif

#ifdef TAUCS_DCOMPLEX_IN_BUILD
  if (m->flags & TAUCS_DCOMPLEX)
    taucs_zccs_times_vec(m, (taucs_dcomplex*) X, (taucs_dcomplex*) B);
#endif

#ifdef TAUCS_SCOMPLEX_IN_BUILD
  if (m->flags & TAUCS_SCOMPLEX)
    taucs_cccs_times_vec(m, (taucs_scomplex*) X, (taucs_scomplex*) B);
#endif
  
  
}
#endif /*TAUCS_CORE_GENERAL*/

#ifndef TAUCS_CORE_GENERAL

void 
taucs_dtl(ccs_times_vec)(taucs_ccs_matrix* m, 
			 taucs_datatype* X,
			 taucs_datatype* B)
{
  int i,ip,j,n;
  taucs_datatype Aij;

  n = m->n;
  
  for (i=0; i < n; i++) B[i] = taucs_zero;

  if (m->flags & TAUCS_SYMMETRIC) {
    for (j=0; j<n; j++) {
      for (ip = (m->colptr)[j]; ip < (m->colptr[j+1]); ip++) {
	i   = (m->rowind)[ip];
	Aij = (m->taucs_values)[ip];
	
	B[i] = taucs_add(B[i],taucs_mul(X[j],Aij));
	if (i != j) 
	  B[j] = taucs_add(B[j],taucs_mul(X[i],Aij));
      }
    }
  } else if (m->flags & TAUCS_HERMITIAN) {
    for (j=0; j<n; j++) {
      for (ip = (m->colptr)[j]; ip < (m->colptr[j+1]); ip++) {
	i   = (m->rowind)[ip];
	Aij = (m->taucs_values)[ip];
	
	B[i] = taucs_add(B[i],taucs_mul(X[j],Aij));
	if (i != j) 
	  B[j] = taucs_add(B[j],taucs_mul(X[i],
					  taucs_conj(Aij)));
      }
    }
  } else {
    for (j=0; j<n; j++) {
      for (ip = (m->colptr)[j]; ip < (m->colptr[j+1]); ip++) {
	i   = (m->rowind)[ip];
	Aij = (m->taucs_values)[ip];
	
	B[i] = taucs_add(B[i],taucs_mul(X[j],Aij));
      }
    }
  }
} 

#endif /*#ifndef TAUCS_CORE_GENERAL*/

#ifdef TAUCS_CORE_SINGLE
void 
taucs_sccs_times_vec_dacc(taucs_ccs_matrix* m, 
			 taucs_single* X,
			 taucs_single* B)
{
  int i,ip,j,n;
  taucs_single Aij;
  taucs_double* Bd;

  assert(m->flags & TAUCS_SYMMETRIC);
  assert(m->flags & TAUCS_LOWER);
  assert(m->flags & TAUCS_SINGLE);

  n = m->n;

  Bd = (taucs_double*) taucs_malloc(n * sizeof(taucs_double));
  if (Bd == NULL) {
    taucs_sccs_times_vec(m,X,B);
    return;
  }
  
  for (i=0; i < n; i++) Bd[i] = 0.0;

  for (j=0; j<n; j++) {
    for (ip = (m->colptr)[j]; ip < (m->colptr[j+1]); ip++) {
      i   = (m->rowind)[ip];
      Aij = (m->taucs_values)[ip];

      Bd[i] += X[j] * Aij;
      if (i != j) 
	Bd[j] += X[i] *Aij;
    }
  }

  for (i=0; i < n; i++) B[i] = (taucs_single) Bd[i];
  taucs_free(Bd);
} 
#endif

/*********************************************************/
/* augment diagonals to diagonal dominance               */
/* current restrictions: A must be square, real          */
/*********************************************************/

#ifdef TAUCS_CORE_GENERAL
taucs_ccs_matrix* 
taucs_ccs_augment_nonpositive_offdiagonals(taucs_ccs_matrix* A)
{

#ifdef TAUCS_DOUBLE_IN_BUILD
  if (A->flags & TAUCS_DOUBLE)
    taucs_dccs_augment_nonpositive_offdiagonals(A);
#endif

#ifdef TAUCS_SINGLE_IN_BUILD
  if (A->flags & TAUCS_SINGLE)
    taucs_sccs_augment_nonpositive_offdiagonals(A);
#endif

#ifdef TAUCS_DCOMPLEX_IN_BUILD
  if (A->flags & TAUCS_DCOMPLEX)
    taucs_zccs_augment_nonpositive_offdiagonals(A);
#endif

#ifdef TAUCS_SCOMPLEX_IN_BUILD
  if (A->flags & TAUCS_SCOMPLEX)
    taucs_cccs_augment_nonpositive_offdiagonals(A);
#endif
  
      
  assert(0);
  return NULL;
}
#endif /*TAUCS_CORE_GENERAL*/

#ifndef TAUCS_CORE_GENERAL

taucs_ccs_matrix* 
taucs_dtl(ccs_augment_nonpositive_offdiagonals)(taucs_ccs_matrix* A)
{
#ifdef TAUCS_CORE_COMPLEX
  assert(0);
#else
  int n,i,j;
  int *tmp;
  taucs_ccs_matrix* A_tmp;
  
  if (!(A->flags & TAUCS_SYMMETRIC) || !(A->flags & TAUCS_LOWER)) {
    taucs_printf("taucs_ccs_augment_nonpositive_offdiagonal: matrix not symmetric or not lower\n");
    return NULL;
  }

  n=A->n;

  tmp = (int *)taucs_calloc((2*n+1),sizeof(int));
  if (!tmp) {
    taucs_printf("taucs_ccs_augment_nonpositive_offdiagonal: out of memory\n");
    return NULL;
  }

  A_tmp = taucs_dtl(ccs_create)(2*n,2*n,2*(A->colptr[n]));
  if (A_tmp == NULL) {
    taucs_free(tmp);
    return NULL;
  }
  A_tmp->flags |= TAUCS_SYMMETRIC | TAUCS_LOWER;
  
  
  for(i=0;i<n;i++) {
    for(j=A->colptr[i];j<A->colptr[i+1];j++) {
      if ((i == A->rowind[j])||(A->taucs_values[j] < 0)) {
	tmp[i]++;
	tmp[i+n]++;
      } else {
	tmp[i]++;
	tmp[A->rowind[j]]++;
      }
    }
  }

  A_tmp->colptr[0]=0;
  for(i=0;i<2*n;i++) A_tmp->colptr[i+1] = A_tmp->colptr[i] + tmp[i];
  for(i=0;i<2*n;i++) tmp[i] = A_tmp->colptr[i];
  
  for(i=0;i<n;i++) {
    for(j=A->colptr[i];j<A->colptr[i+1];j++) {
      if ((i == A->rowind[j])||(A->taucs_values[j] < 0)) {
	A_tmp->rowind[tmp[i]]=A->rowind[j];
	A_tmp->taucs_values[tmp[i]++]=A->taucs_values[j];
	A_tmp->rowind[tmp[i+n]]=A->rowind[j]+n;
	A_tmp->taucs_values[tmp[i+n]++]=A->taucs_values[j];
      } else {
	A_tmp->rowind[tmp[i]]=A->rowind[j]+n;
	A_tmp->taucs_values[tmp[i]++]=-A->taucs_values[j];
	A_tmp->rowind[tmp[A->rowind[j]]]=i+n;
	A_tmp->taucs_values[tmp[A->rowind[j]]++]=-A->taucs_values[j];
      }
    }
  }
  taucs_free(tmp);

  return A_tmp;
#endif
	/* added omer*/
	return NULL;
}

#endif /*#ifndef TAUCS_CORE_GENERAL*/
/*********************************************************/
/*                                                       */
/*********************************************************/



syntax highlighted by Code2HTML, v. 0.9.1