/* This software was developed by Bruce Hendrickson and Robert Leland   *
 * at Sandia National Laboratories under US Department of Energy        *
 * contract DE-AC04-76DP00789 and is copyrighted by Sandia Corporation. */

#include <stdio.h>
#include "params.h"
#include "defs.h"
#include "structs.h"

int LIMIT_KL_EWGTS = FALSE;	/* limit range of edge weights in multilevel-KL? */
double EWGT_RATIO_MAX = .25;	/* if so, max allowed ewgt/nvtxs */

void      coarsen_kl(graph, nvtxs, nedges, using_vwgts, using_ewgts, term_wgts,
		     igeom, coords, vwgt_max, assignment, goal, architecture, hops,
		          solver_flag, ndims, nsets, vmax, mediantype, mkconnected,
		               eigtol, nstep, step, pbndy_list, weights, give_up)
/* Coarsen until nvtxs < vmax, compute and uncoarsen. */
struct vtx_data **graph;	/* array of vtx data for graph */
int       nvtxs;		/* number of vertices in graph */
int       nedges;		/* number of edges in graph */
int       using_vwgts;		/* are vertices weights being used? */
int       using_ewgts;		/* are edge weights being used? */
float    *term_wgts[];		/* weights for terminal propogation */
int       igeom;                /* dimension for geometric information */
float   **coords;               /* coordinates for vertices */
int       vwgt_max;		/* largest vertex weight */
short    *assignment;		/* processor each vertex gets assigned to */
double   *goal;			/* desired set sizes */
int       architecture;		/* 0 => hypercube, d => d-dimensional mesh */
short     (*hops)[MAXSETS];	/* cost of edge between sets */
int       solver_flag;		/* which eigensolver to use */
int       ndims;		/* number of eigenvectors to calculate */
int       nsets;		/* number of sets being divided into */
int       vmax;			/* largest subgraph to stop coarsening */
int       mediantype;		/* flag for different assignment strategies */
int       mkconnected;		/* make graph connected before eigensolver? */
double    eigtol;		/* tolerence in eigen calculation */
int       nstep;		/* number of coarsenings between RQI steps */
int       step;			/* current step number */
int     **pbndy_list;		/* pointer to returned boundary list */
double   *weights;		/* weights of vertices in each set */
int       give_up;		/* has coarsening bogged down? */
{
    extern FILE *Output_File;	/* output file or null */
    extern int DEBUG_TRACE;	/* trace the execution of the code */
    extern int DEBUG_COARSEN;	/* debug flag for coarsening */
    extern int DEBUG_CONNECTED;	/* debug flag for connectivity checking */
    extern double COARSEN_RATIO_MIN;	/* vtx reduction demanded */
    extern int COARSEN_VWGTS;	/* use vertex weights while coarsening? */
    extern int COARSEN_EWGTS;	/* use edge weights while coarsening? */
    extern int COARSE_KL_BOTTOM;/* force KL invocation at bottom level? */
    extern int KL_ONLY_BNDY;	/* only initialize boundary vertices? */
    extern double KL_IMBALANCE;	/* fractional imbalance allowed in KL */
    extern int MAPPING_TYPE;	/* how to get from eigenvectors to partition */
    struct connect_data *cdata;	/* data structure for enforcing connectivity */
    struct vtx_data **cgraph;	/* array of vtx data for coarsened graph */
    double   *yvecs[MAXDIMS + 1];	/* eigenvectors for subgraph */
    double    evals[MAXDIMS + 1];	/* eigenvalues returned */
    double    new_goal[MAXSETS];/* new goal if not using vertex weights */
    double   *real_goal;	/* chooses between goal and new_goal */
    double    goal_weight;	/* total weight of vertices in goal */
    double   *vwsqrt = NULL;	/* square root of vertex weights */
    double    maxdeg;		/* maximum weighted degree of a vertex */
    double    temp_goal[2];     /* goal to simulate bisection while striping */
    double   *fake_goal;        /* either goal or temp_goal */
    float    *cterm_wgts[MAXSETS];	/* terminal weights for coarse graph */
    float    *new_term_wgts[MAXSETS];	/* modified for Bui's method */
    float   **real_term_wgts;	/* which of previous two to use */
    float     ewgt_max;		/* largest edge weight in graph */
    float    *twptr;		/* loops through term_wgts */
    float    *twptr_save;	/* copy of twptr */
    float    *ctwptr;		/* loops through cterm_wgts */
    float   **ccoords;		/* coarse graph coordinates */
    int      *active;		/* space for assign routine */
    int      *v2cv;		/* mapping from fine to coarse vertices */
    int      *cv2v;		/* mapping from coarse to fine vertices */
    int      *bndy_list;	/* list of vertices on boundary */
    int      *cbndy_list;	/* list of vertices of coarse graph on boundary */
    int      *mflag;		/* flags indicating matching */
    short    *cassignment;	/* set assignments for coarsened vertices */
    int       clist_length;	/* length of coarse graph boundary vtx list */
    int       list_length;	/* length of boundary vtx list */
    int       vtx;		/* vertex in graph */
    int       cvtx;		/* vertex in coarse graph */
    int       cnvtxs;		/* number of vertices in coarsened graph */
    int       cnedges;		/* number of edges in coarsened graph */
    int       cvwgt_max;	/* largest vertex weight in coarsened graph */
    int       nextstep;		/* next step in RQI test */
    int       max_dev;		/* largest allowed deviation from balance */
    int       set;		/* set a vertex is in */
    int       i, j;		/* loop counters */
    int       sfree();
    double   *smalloc(), *srealloc(), find_maxdeg();
    void      makevwsqrt(), make_connected(), print_connected(), eigensolve();
    void      make_unconnected(), assign(), klspiff(), coarsen1(), free_graph();
    void      compress_ewgts(), restore_ewgts(), count_weights();

    if (DEBUG_COARSEN > 0 || DEBUG_TRACE > 0) {
	printf("<Entering coarsen_kl, step=%d, nvtxs=%d, nedges=%d, vmax=%d>\n",
	       step, nvtxs, nedges, vmax);
    }

    /* Is problem small enough to solve? */
    if (nvtxs <= vmax || give_up) {
	if (using_vwgts) {
	    vwsqrt = (double *) smalloc((unsigned) (nvtxs + 1) * sizeof(double));
	    makevwsqrt(vwsqrt, graph, nvtxs);
	}
	else
	    vwsqrt = NULL;

	/* Create space for subgraph yvecs. */
	for (i = 1; i <= ndims; i++) {
	    yvecs[i] = (double *) smalloc((unsigned) (nvtxs + 1) * sizeof(double));
	}

	active = (int *) smalloc((unsigned) nvtxs * sizeof(int));
	if (mkconnected) {
	    make_connected(graph, nvtxs, &nedges, (short *) &(yvecs[1][0]),
			   active, &cdata, using_ewgts);
	    if (DEBUG_CONNECTED > 0) {
		printf("Enforcing connectivity on coarse graph\n");
		print_connected(cdata);
	    }
	}

	/* If not coarsening ewgts, then need care with term_wgts. */
	if (!using_ewgts && term_wgts[1] != NULL && step != 0) {
	    twptr = (float *) smalloc((unsigned)
		(nvtxs + 1) * (nsets - 1) * sizeof(float));
	    twptr_save = twptr;
	    for (j = 1; j < nsets; j++) {
	        new_term_wgts[j] = twptr;
	        twptr += nvtxs + 1;
	    }

	    for (j = 1; j < nsets; j++) {
	        twptr = term_wgts[j];
	        ctwptr = new_term_wgts[j];
	        for (i = 1; i <= nvtxs; i++) {
		    if (twptr[i] > .5) ctwptr[i] = 1;
		    else if (twptr[i] < -.5) ctwptr[i] = -1;
		    else ctwptr[i] = 0;
		}
	    }
	    real_term_wgts = new_term_wgts;
	}
	else {
	    real_term_wgts = term_wgts;
	    new_term_wgts[1] = NULL;
	}

	if (!COARSEN_VWGTS && step != 0) {	/* Construct new goal */
	    goal_weight = 0;
	    for (i = 0; i < nsets; i++)
		goal_weight += goal[i];
	    for (i = 0; i < nsets; i++)
		new_goal[i] = goal[i] * (nvtxs / goal_weight);
	    real_goal = new_goal;
	}
	else
	    real_goal = goal;

	if (ndims == 1 && nsets > 2) {		/* Striping. */
	    mediantype = 4;
	    temp_goal[0] = temp_goal[1] = 0;
	    for (i = 0; 2 * i + 1 < nsets; i++) {
		 temp_goal[0] += real_goal[i];
		 temp_goal[1] += real_goal[nsets - 1 - i];
	    }
	    i = nsets / 2;
	    if (2 * i != nsets) {
		temp_goal[0] += .5 * real_goal[i];
		temp_goal[1] += .5 * real_goal[i];
	    }
	    fake_goal = temp_goal;
	}
	else {
	    mediantype = MAPPING_TYPE;
	    fake_goal = real_goal;
	}

	/* Partition coarse graph with spectral method */
	maxdeg = find_maxdeg(graph, nvtxs, using_ewgts, &ewgt_max);
	eigensolve(graph, nvtxs, nedges, maxdeg, vwgt_max, vwsqrt,
		   using_vwgts, using_ewgts, real_term_wgts, 0, (float **) NULL,
		   yvecs, evals, architecture, assignment, fake_goal,
		   solver_flag, FALSE, 0, ndims, mediantype, eigtol);

	if (mkconnected)
	    make_unconnected(graph, &nedges, &cdata, using_ewgts);

	assign(graph, yvecs, nvtxs, ndims, architecture, nsets, vwsqrt, assignment,
	       active, mediantype, real_goal, vwgt_max);
/*
simple_part(graph, nvtxs, assignment, nsets, 1, real_goal);
*/
	sfree((char *) active);

	count_weights(graph, nvtxs, assignment, nsets, weights, (vwgt_max != 1));

	bndy_list = NULL;
	if (COARSE_KL_BOTTOM || !(step % nstep)) {
	    if (LIMIT_KL_EWGTS)
		compress_ewgts(graph, nvtxs, nedges, ewgt_max, using_ewgts);

	    max_dev = (step == 0) ? vwgt_max : 5 * vwgt_max;
	    goal_weight = 0;
	    for (i = 0; i < nsets; i++) {
		goal_weight += real_goal[i];
	    }
	    goal_weight *= KL_IMBALANCE / nsets;
	    if (goal_weight > max_dev) {
		max_dev = goal_weight;
	    }

	    if (KL_ONLY_BNDY) {
		/* On small graph, quickest to include everybody in list. */
		bndy_list = (int *) smalloc((unsigned) (nvtxs+1)*sizeof(int));
		for (i=0; i<nvtxs; i++) {
		    bndy_list[i] = i+1;
		}
		bndy_list[nvtxs] = 0;
	    }
	    klspiff(graph, nvtxs, assignment, nsets, hops, real_goal,
		    real_term_wgts, max_dev, maxdeg, using_ewgts,
		    &bndy_list, weights);
	    if (LIMIT_KL_EWGTS)
		restore_ewgts(graph, nvtxs);
	}

	else if (KL_ONLY_BNDY) {	/* Find boundary vertices directly. */
	    bndy_list = (int *) smalloc((unsigned) (nvtxs+1)*sizeof(int));
	    list_length = 0;
	    for (i=1; i<=nvtxs; i++) {
		set = assignment[i];
		for (j=1; j<graph[i]->nedges; j++) {
		    if (assignment[graph[i]->edges[j]] != set) {
			bndy_list[list_length++] = i;
			break;
		    }
		}
	    }
	    bndy_list[list_length] = 0;
	    bndy_list = (int *) srealloc((char *) bndy_list,
			(unsigned) (list_length + 1) * sizeof(int));
	}
	*pbndy_list = bndy_list;

	if (real_term_wgts != term_wgts && new_term_wgts[1] != NULL) {
	    sfree((char *) real_term_wgts[1]);
	}
	if (vwsqrt != NULL)
	    sfree((char *) vwsqrt);
	for (i = ndims; i > 0; i--)
	    sfree((char *) yvecs[i]);
	return;
    }

    /* Otherwise I have to coarsen. */
    if (coords != NULL) {
        ccoords = (float **) smalloc((unsigned) igeom * sizeof(float *));
    }
    else {
        ccoords = NULL;
    }
    coarsen1(graph, nvtxs, nedges, &cgraph, &cnvtxs, &cnedges, &v2cv,
	     igeom, coords, ccoords, using_ewgts);

    if (term_wgts[1] != NULL) {
	twptr = (float *) smalloc((unsigned)
	    (cnvtxs + 1) * (nsets - 1) * sizeof(float));
	twptr_save = twptr;
	for (i = (cnvtxs + 1) * (nsets - 1); i ; i--) {
	    *twptr++ = 0;
	}
	twptr = twptr_save;
	for (j = 1; j < nsets; j++) {
	    cterm_wgts[j] = twptr;
	    twptr += cnvtxs + 1;
	}
	for (j = 1; j < nsets; j++) {
	    ctwptr = cterm_wgts[j];
	    twptr = term_wgts[j];
	    for (i = 1; i < nvtxs; i++){
	        ctwptr[v2cv[i]] += twptr[i];
	    }
	}
    }
    else {
	cterm_wgts[1] = NULL;
    }

    /* If coarsening isn't working very well, give up and partition. */
    give_up = FALSE;
    if (nvtxs * COARSEN_RATIO_MIN < cnvtxs && cnvtxs > vmax) {
	printf("WARNING: Coarsening not making enough progress, nvtxs = %d, cnvtxs = %d.\n",
	    nvtxs, cnvtxs);
	printf("         Recursive coarsening being stopped prematurely.\n");
	if (Output_File != NULL) {
	    fprintf(Output_File, 
		"WARNING: Coarsening not making enough progress, nvtxs = %d, cnvtxs = %d.\n",
	    nvtxs, cnvtxs);
	    fprintf(Output_File, 
		"         Recursive coarsening being stopped prematurely.\n");
	}
	give_up = TRUE;
    }

    /* Now recurse on coarse subgraph. */
    if (COARSEN_VWGTS) {
	cvwgt_max = 0;
	for (i = 1; i <= cnvtxs; i++) {
	    if (cgraph[i]->vwgt > cvwgt_max)
		cvwgt_max = cgraph[i]->vwgt;
	}
    }
    else
	cvwgt_max = 1;

    cassignment = (short *) smalloc((unsigned) (cnvtxs + 1) * sizeof(short));
    nextstep = step + 1;
    coarsen_kl(cgraph, cnvtxs, cnedges, COARSEN_VWGTS, COARSEN_EWGTS, cterm_wgts,
	       igeom, ccoords, cvwgt_max, cassignment, goal, architecture, hops,
	       solver_flag, ndims, nsets, vmax, mediantype, mkconnected,
	       eigtol, nstep, nextstep, &cbndy_list, weights, give_up);

    /* Interpolate assignment back to fine graph. */
    for (i = 1; i <= nvtxs; i++)
	assignment[i] = cassignment[v2cv[i]];

    if (KL_ONLY_BNDY) {
	/* Construct boundary list from coarse boundary list. */
	cv2v = (int *) smalloc((unsigned) (cnvtxs + 1) * sizeof(int));
        mflag = (int *) smalloc((unsigned) (nvtxs + 1) * sizeof(int));
	for (i=1; i<=cnvtxs; i++) {
	    cv2v[i] = 0;
	}
	for (i=1; i<=nvtxs; i++) {
	    mflag[i] = 0;
	    cvtx = v2cv[i];
	    if (cv2v[cvtx] == 0) {
		cv2v[cvtx] = i;
	    }
	    else {
		mflag[cv2v[cvtx]] = i;
	    }
	}

	clist_length = 0;
	while (cbndy_list[clist_length] != 0) {
	    clist_length++;
	}
	bndy_list = (int *) smalloc((unsigned) (2 * clist_length + 1) * sizeof(int));

	list_length = 0;
	for (i=0; i<clist_length; i++) {
	    vtx = cv2v[cbndy_list[i]];
	    bndy_list[list_length++] = vtx;
	    if (mflag[vtx] != 0) {
		bndy_list[list_length++] = mflag[vtx];
	    }
	}
	bndy_list[list_length] = 0;
	bndy_list = (int *) srealloc((char *) bndy_list,
			(unsigned) (list_length + 1) * sizeof(int));

        sfree((char *) mflag);
	sfree((char *) cv2v);
	sfree((char *) cbndy_list);
    }
    else {
	bndy_list = NULL;
    }

    /* Free the space that was allocated. */
    sfree((char *) cassignment);
    if (cterm_wgts[1] != NULL)
	sfree((char *) cterm_wgts[1]);
    free_graph(cgraph);
    sfree((char *) v2cv);

    /* Smooth using KL every nstep steps. */
    if (!(step % nstep)) {
	if (!COARSEN_VWGTS && step != 0) {	/* Construct new goal */
	    goal_weight = 0;
	    for (i = 0; i < nsets; i++)
		goal_weight += goal[i];
	    for (i = 0; i < nsets; i++)
		new_goal[i] = goal[i] * (nvtxs / goal_weight);
	    real_goal = new_goal;
	}
	else
	    real_goal = goal;

	maxdeg = find_maxdeg(graph, nvtxs, using_ewgts, &ewgt_max);
	if (LIMIT_KL_EWGTS)
	    compress_ewgts(graph, nvtxs, nedges, ewgt_max,
			   using_ewgts);

	/* If not coarsening ewgts, then need care with term_wgts. */
	if (!using_ewgts && term_wgts[1] != NULL && step != 0) {
	    twptr = (float *) smalloc((unsigned)
		(nvtxs + 1) * (nsets - 1) * sizeof(float));
	    twptr_save = twptr;
	    for (j = 1; j < nsets; j++) {
	        new_term_wgts[j] = twptr;
	        twptr += nvtxs + 1;
	    }

	    for (j = 1; j < nsets; j++) {
	        twptr = term_wgts[j];
	        ctwptr = new_term_wgts[j];
	        for (i = 1; i <= nvtxs; i++) {
		    if (twptr[i] > .5) ctwptr[i] = 1;
		    else if (twptr[i] < -.5) ctwptr[i] = -1;
		    else ctwptr[i] = 0;
		}
	    }
	    real_term_wgts = new_term_wgts;
	}
	else {
	    real_term_wgts = term_wgts;
	    new_term_wgts[1] = NULL;
	}

	max_dev = (step == 0) ? vwgt_max : 5 * vwgt_max;
	goal_weight = 0;
	for (i = 0; i < nsets; i++) {
	    goal_weight += real_goal[i];
	}
	goal_weight *= KL_IMBALANCE / nsets;
	if (goal_weight > max_dev) {
	    max_dev = goal_weight;
	}

	if (!COARSEN_VWGTS) {
	    count_weights(graph, nvtxs, assignment, nsets, weights,
		(vwgt_max != 1));
	}

	klspiff(graph, nvtxs, assignment, nsets, hops, real_goal,
		real_term_wgts, max_dev, maxdeg, using_ewgts,
		&bndy_list, weights);

	if (real_term_wgts != term_wgts && new_term_wgts[1] != NULL) {
	    sfree((char *) real_term_wgts[1]);
	}

	if (LIMIT_KL_EWGTS)
	    restore_ewgts(graph, nvtxs);
    }
    *pbndy_list = bndy_list;

    if (ccoords != NULL) {
        for (i = 0; i < igeom; i++)
            sfree((char *) ccoords[i]);
        sfree((char *) ccoords);
    }

    if (DEBUG_COARSEN > 0) {
	printf(" Leaving coarsen_kl, step=%d\n", step);
    }
}


syntax highlighted by Code2HTML, v. 0.9.1