/*  testScatterDenseMtx.c  */

#include "../spoolesMPI.h"
#include "../../Drand.h"
#include "../../timings.h"

/*--------------------------------------------------------------------*/

int
main ( int argc, char *argv[] )
/*
   ------------------------------------------------------------------
   this program tests the simple split and merge of a DenseMtx object

   (1) process root generates a nrow x ncol DenseMtx object
   (2) using a random map, scatter the rows into local matrices
   (3) gather the local matrices into a second global matrix
       and compare

   created -- 98sep26, cca
   ------------------------------------------------------------------
*/
{
char        *buffer ;
DenseMtx    *X, *Y, *Z ;
double      t1, t2 ;
double      checksums[3], Xchecksums[3], Ychecksums[3], Zchecksums[3] ;
Drand       drand ;
int         inc1, inc2, length, myid, msglvl, ncol, 
            nproc, nrow, root, seed, tag, type, v ;
int         *map ;
int         stats[4], tstats[4] ;
IV          *mapIV ;
FILE        *msgFile ;
/*
   ---------------------------------------------------------------
   find out the identity of this process and the number of process
   ---------------------------------------------------------------
*/
/*
fprintf(stdout, "\n stdout, MPI_COMM_WORLD = %p", MPI_COMM_WORLD) ;
fflush(stdout) ;
*/
MPI_Init(&argc, &argv) ;
MPI_Comm_rank(MPI_COMM_WORLD, &myid) ;
MPI_Comm_size(MPI_COMM_WORLD, &nproc) ;
/*
fprintf(stdout, "\n process %d of %d, argc = %d", myid, nproc, argc) ;
fflush(stdout) ;
*/
if ( argc != 10 ) {
   fprintf(stdout, 
"\n\n usage : %s msglvl msgFile type nrow ncol inc1 inc2 seed root"
"\n    msglvl  -- message level"
"\n    msgFile -- message file"
"\n    type    -- type of entries"
"\n      1 -- real"
"\n      2 -- complex"
"\n    nrow -- number of rows"
"\n    ncol -- number of columns"
"\n    inc1 -- row increment"
"\n    inc2 -- column increment"
"\n    seed -- random number seed"
"\n    root -- root processor"
"\n", argv[0]) ;
   return(0) ;
}
msglvl = atoi(argv[1]) ;
if ( strcmp(argv[2], "stdout") == 0 ) {
   msgFile = stdout ;
} else {
   length = strlen(argv[2]) + 1 + 4 ;
   buffer = CVinit(length, '\0') ;
   sprintf(buffer, "%s.%d", argv[2], myid) ;
   if ( (msgFile = fopen(buffer, "w")) == NULL ) {
      fprintf(stderr, "\n fatal error in %s"
              "\n unable to open file %s\n",
              argv[0], argv[2]) ;
      return(0) ;
   }
   CVfree(buffer) ;
}
type = atoi(argv[3]) ;
nrow = atoi(argv[4]) ;
ncol = atoi(argv[5]) ;
inc1 = atoi(argv[6]) ;
inc2 = atoi(argv[7]) ;
seed = atoi(argv[8]) ;
root = atoi(argv[9]) ;
fprintf(msgFile, 
        "\n %s "
        "\n msglvl     -- %d" 
        "\n msgFile    -- %s" 
        "\n type       -- %d" 
        "\n nrow       -- %d" 
        "\n ncol       -- %d" 
        "\n inc1       -- %d" 
        "\n inc2       -- %d" 
        "\n seed       -- %d" 
        "\n root       -- %d" 
        "\n",
        argv[0], msglvl, argv[2], type, nrow, ncol, 
        inc1, inc2, seed, root) ;
fflush(msgFile) ;
/*
   -----------------------------
   generate the DenseMtx object
   -----------------------------
*/
if ( myid == root ) {
   X = DenseMtx_new() ;
   fprintf(msgFile, "\n X = %p", X) ;
   fflush(msgFile) ;
   MARKTIME(t1) ;
   DenseMtx_init(X, type, 1, -1, nrow, ncol, inc1, inc2) ;
   Drand_setDefaultFields(&drand) ;
   Drand_setSeed(&drand, seed) ;
   Drand_setUniform(&drand, 0.0, 1.0) ;
   switch ( type ) {
   case SPOOLES_REAL :
      Drand_fillDvector(&drand, nrow*ncol, DenseMtx_entries(X)) ;
      break ;
   case SPOOLES_COMPLEX :
      Drand_fillDvector(&drand, 2*nrow*ncol, DenseMtx_entries(X)) ;
      break ;
   }
/*
   ------------------------------------------
   compute the serial checksums of the matrix
   ------------------------------------------
*/
   DenseMtx_checksums(X, Xchecksums) ;
   MARKTIME(t2) ;
   fprintf(msgFile, "\n CPU %8.3f : initialize the DenseMtx object",
           t2 - t1) ;
   fflush(msgFile) ;
   fprintf(msgFile, "\n\n DenseMtx generated") ;
   if ( msglvl > 2 ) {
      DenseMtx_writeForHumanEye(X, msgFile) ;
   } else {
      DenseMtx_writeStats(X, msgFile) ;
   }
   fflush(msgFile) ;
/*
   ---------------------
   generate a random map
   ---------------------
*/
   MARKTIME(t1) ;
   mapIV = IV_new() ;
   IV_init(mapIV, nrow, NULL) ;
   map = IV_entries(mapIV) ;
   Drand_setDefaultFields(&drand) ;
   Drand_setSeed(&drand, seed) ;
   Drand_setUniform(&drand, 0.0, (double) nrow) ;
   for ( v = 0 ; v < nrow ; v++ ) {
      map[v] = ((int) Drand_value(&drand)) % nproc ;
      if ( map[v] == root ) {
         map[v] = nproc - 1 ;
      }
   }
   MARKTIME(t2) ;
   fprintf(msgFile, "\n CPU %8.3f : generate random map", t2 - t1) ;
   fflush(msgFile) ;
   if ( msglvl > 2 ) {
      fprintf(msgFile, "\n\n map") ;
      IV_writeForHumanEye(mapIV, msgFile) ;
      fflush(msgFile) ;
   }
} else {
   X = NULL ;
   mapIV = NULL ;
}
/*
   ------------------------------------------
   now scatter the matrix with the random map
   ------------------------------------------
*/
stats[0]  = stats[1]  = stats[2]  = stats[3]  = 0 ;
tstats[0] = tstats[1] = tstats[2] = tstats[3] = 0 ;
MARKTIME(t1) ;
tag = 1 ;
Y = DenseMtx_MPI_splitFromGlobalByRows(X, NULL, mapIV, root, stats, 
                              msglvl, msgFile, tag, MPI_COMM_WORLD) ;
MARKTIME(t2) ;
fprintf(msgFile, "\n CPU %8.3f : scatter matrix ", t2 - t1) ;
fprintf(msgFile, 
        "\n send stats : %d messages with %d bytes"
        "\n recv stats : %d messages with %d bytes",
        stats[0], stats[2], stats[1], stats[3]) ;
fflush(msgFile) ;
MPI_Reduce((void *) stats, (void *) tstats, 4, MPI_INT,
          MPI_SUM, root, MPI_COMM_WORLD) ;
if ( myid == root ) {
   fprintf(msgFile, 
           "\n total send stats : %d messages with %d bytes"
           "\n total recv stats : %d messages with %d bytes",
           tstats[0], tstats[2], tstats[1], tstats[3]) ;
   fflush(msgFile) ;
}
if ( Y != NULL ) {
   fprintf(msgFile, "\n\n local matrix") ;
   if ( msglvl > 2 ) {
      DenseMtx_writeForHumanEye(Y, msgFile) ;
   } else {
      DenseMtx_writeStats(Y, msgFile) ;
   }
} else {
   fprintf(msgFile, "\n\n local matrix is NULL") ;
}
fflush(msgFile) ;
/*
   -----------------------------------------------
   compute the checksums of the distributed matrix
   -----------------------------------------------
*/
if ( Y != NULL ) {
   DenseMtx_checksums(Y, checksums) ;
} else {
   checksums[0] = checksums[1] = checksums[2] = 0.0 ;
}
MPI_Reduce((void *) checksums, (void *) Ychecksums, 3, MPI_DOUBLE,
          MPI_SUM, root, MPI_COMM_WORLD) ;
if ( myid == root ) {
   fprintf(msgFile, 
           "\n\n checksums for original matrix    : %12.4e %12.4e"
           "\n checksums for distributed matrix : %12.4e %12.4e"
           "\n error in checksum                : %12.4e %12.4e",
         Xchecksums[0], Xchecksums[2], Ychecksums[0], Ychecksums[2],
         Ychecksums[0] - Xchecksums[0], Ychecksums[2] - Xchecksums[2]) ;
}
/*
   -----------------------------------------------------
   gather the local matrices into a second global matrix
   -----------------------------------------------------
*/
MARKTIME(t1) ;
stats[0] = stats[1] = stats[2] = stats[3] = 0 ;
if ( myid == root ) {
   Z = DenseMtx_new() ;
   fprintf(msgFile, "\n Z = %p", Z) ;
} else {
   Z = NULL ;
}
Z = DenseMtx_MPI_mergeToGlobalByRows(Z, Y, root, stats, msglvl,
                                     msgFile, tag, MPI_COMM_WORLD) ;
fprintf(msgFile, "\n Z = %p", Z) ;
MARKTIME(t2) ;
fprintf(msgFile, "\n CPU %8.3f : merge into global matrix ", t2 - t1) ;
fprintf(msgFile, "\n send stats : %d messages with %d bytes"
                 "\n recv stats : %d messages with %d bytes",
                 stats[0], stats[2], stats[1], stats[3]) ;
fflush(msgFile) ;
MPI_Reduce((void *) stats, (void *) tstats, 4, MPI_INT,
          MPI_SUM, root, MPI_COMM_WORLD) ;
if ( myid == root ) {
   fprintf(msgFile, "\n total send stats : %d messages with %d bytes"
                    "\n total recv stats : %d messages with %d bytes",
                    tstats[0], tstats[2], tstats[1], tstats[3]) ;
   DenseMtx_sort(Z) ;
   fprintf(msgFile, "\n\n global Z matrix") ;
   if ( msglvl > 2 ) {
      DenseMtx_writeForHumanEye(Z, msgFile) ;
   } else {
      DenseMtx_writeStats(Z, msgFile) ;
   }
   fflush(msgFile) ;
   DenseMtx_checksums(Z, Zchecksums) ;
   fprintf(msgFile, 
           "\n\n checksums for original matrix    : %12.4e %12.4e"
           "\n checksums for distributed matrix : %12.4e %12.4e"
           "\n checksums for global matrix      : %12.4e %12.4e"
           "\n X x Y error in checksum          : %12.4e %12.4e"
           "\n X x Z error in checksum          : %12.4e %12.4e",
         Xchecksums[0], Xchecksums[2], 
         Ychecksums[0], Ychecksums[2],
         Zchecksums[0], Zchecksums[2],
         Xchecksums[0] - Ychecksums[0], Xchecksums[2] - Ychecksums[2],
         Xchecksums[0] - Zchecksums[0], Xchecksums[2] - Zchecksums[2]) ;
}
/*
   ----------------
   free the objects
   ----------------
*/
if ( myid == root ) {
   IV_free(mapIV) ;
}
if ( X != NULL ) {
   DenseMtx_free(X) ;
}
if ( Y != NULL ) {
   DenseMtx_free(Y) ;
}
if ( Z != NULL ) {
   DenseMtx_free(Z) ;
}
MPI_Finalize() ;

fprintf(msgFile, "\n") ;
fclose(msgFile) ;

return(0) ; }

/*--------------------------------------------------------------------*/


syntax highlighted by Code2HTML, v. 0.9.1