src/cv/bsdfmesh.c

#ifndef lint
static const char RCSid[] = "$Id: bsdfmesh.c,v 2.10 2013/09/26 14:57:18 greg Exp $";
#endif
/*
 * Create BSDF advection mesh from radial basis functions.
 *
 *      G. Ward
 */

#ifndef _WIN32
#include <unistd.h>
#include <sys/wait.h>
#include <sys/mman.h>
#endif
#define _USE_MATH_DEFINES
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include "bsdfrep.h"
                                /* number of processes to run */
int                     nprocs = 1;
                                /* number of children (-1 in child) */
static int              nchild = 0;

typedef struct {
        int             nrows, ncols;   /* array size (matches migration) */
        float           *price;         /* migration prices */
        short           *sord;          /* sort for each row, low to high */
        float           *prow;          /* current price row */
} PRICEMAT;                     /* sorted pricing matrix */

#define pricerow(p,i)   ((p)->price + (i)*(p)->ncols)
#define psortrow(p,i)   ((p)->sord + (i)*(p)->ncols)

/* Create a new migration holder (sharing memory for multiprocessing) */
static MIGRATION *
new_migration(RBFNODE *from_rbf, RBFNODE *to_rbf)
{
        size_t          memlen = sizeof(MIGRATION) +
                                sizeof(float)*(from_rbf->nrbf*to_rbf->nrbf - 1);
        MIGRATION       *newmig;
#ifdef _WIN32
        if (nprocs > 1)
                fprintf(stderr, "%s: warning - multiprocessing not supported\n",
                                progname);
        nprocs = 1;
        newmig = (MIGRATION *)malloc(memlen);
#else
        if (nprocs <= 1) {                      /* single process? */
                newmig = (MIGRATION *)malloc(memlen);
        } else {                                /* else need to share memory */
                newmig = (MIGRATION *)mmap(NULL, memlen, PROT_READ|PROT_WRITE,
                                                MAP_ANON|MAP_SHARED, -1, 0);
                if ((void *)newmig == MAP_FAILED)
                        newmig = NULL;
        }
#endif
        if (newmig == NULL) {
                fprintf(stderr, "%s: cannot allocate new migration\n", progname);
                exit(1);
        }
        newmig->rbfv[0] = from_rbf;
        newmig->rbfv[1] = to_rbf;
                                                /* insert in edge lists */
        newmig->enxt[0] = from_rbf->ejl;
        from_rbf->ejl = newmig;
        newmig->enxt[1] = to_rbf->ejl;
        to_rbf->ejl = newmig;
        newmig->next = mig_list;                /* push onto global list */
        return(mig_list = newmig);
}

#ifdef _WIN32
#define await_children(n)       (void)(n)
#define run_subprocess()        0
#define end_subprocess()        (void)0
#else

/* Wait for the specified number of child processes to complete */
static void
await_children(int n)
{
        int     exit_status = 0;

        if (n > nchild)
                n = nchild;
        while (n-- > 0) {
                int     status;
                if (wait(&status) < 0) {
                        fprintf(stderr, "%s: missing child(ren)!\n", progname);
                        nchild = 0;
                        break;
                }
                --nchild;
                if (status) {                   /* something wrong */
                        if ((status = WEXITSTATUS(status)))
                                exit_status = status;
                        else
                                exit_status += !exit_status;
                        fprintf(stderr, "%s: subprocess died\n", progname);
                        n = nchild;             /* wait for the rest */
                }
        }
        if (exit_status)
                exit(exit_status);
}

/* Start child process if multiprocessing selected */
static pid_t
run_subprocess(void)
{
        int     status;
        pid_t   pid;

        if (nprocs <= 1)                        /* any children requested? */
                return(0);
        await_children(nchild + 1 - nprocs);    /* free up child process */
        if ((pid = fork())) {
                if (pid < 0) {
                        fprintf(stderr, "%s: cannot fork subprocess\n",
                                        progname);
                        await_children(nchild);
                        exit(1);
                }
                ++nchild;                       /* subprocess started */
                return(pid);
        }
        nchild = -1;
        return(0);                              /* put child to work */
}

/* If we are in subprocess, call exit */
#define end_subprocess()        if (nchild < 0) _exit(0); else

#endif  /* ! _WIN32 */

/* Comparison routine needed for sorting price row */
static int
msrt_cmp(void *b, const void *p1, const void *p2)
{
        PRICEMAT        *pm = (PRICEMAT *)b;
        float           c1 = pm->prow[*(const short *)p1];
        float           c2 = pm->prow[*(const short *)p2];

        if (c1 > c2) return(1);
        if (c1 < c2) return(-1);
        return(0);
}

/* Compute (and allocate) migration price matrix for optimization */
static void
price_routes(PRICEMAT *pm, const RBFNODE *from_rbf, const RBFNODE *to_rbf)
{
        FVECT   *vto = (FVECT *)malloc(sizeof(FVECT) * to_rbf->nrbf);
        int     i, j;

        pm->nrows = from_rbf->nrbf;
        pm->ncols = to_rbf->nrbf;
        pm->price = (float *)malloc(sizeof(float) * pm->nrows*pm->ncols);
        pm->sord = (short *)malloc(sizeof(short) * pm->nrows*pm->ncols);
        
        if ((pm->price == NULL) | (pm->sord == NULL) | (vto == NULL)) {
                fprintf(stderr, "%s: Out of memory in migration_costs()\n",
                                progname);
                exit(1);
        }
        for (j = to_rbf->nrbf; j--; )           /* save repetitive ops. */
                ovec_from_pos(vto[j], to_rbf->rbfa[j].gx, to_rbf->rbfa[j].gy);

        for (i = from_rbf->nrbf; i--; ) {
            const double        from_ang = R2ANG(from_rbf->rbfa[i].crad);
            FVECT               vfrom;
            short               *srow;
            ovec_from_pos(vfrom, from_rbf->rbfa[i].gx, from_rbf->rbfa[i].gy);
            pm->prow = pricerow(pm,i);
            srow = psortrow(pm,i);
            for (j = to_rbf->nrbf; j--; ) {
                double          dprod = DOT(vfrom, vto[j]);
                pm->prow[j] = ((dprod >= 1.) ? .0 : acos(dprod)) +
                                fabs(R2ANG(to_rbf->rbfa[j].crad) - from_ang);
                srow[j] = j;
            }
            qsort_r(srow, pm->ncols, sizeof(short), pm, &msrt_cmp);
        }
        free(vto);
}

/* Free price matrix */
static void
free_routes(PRICEMAT *pm)
{
        free(pm->price); pm->price = NULL;
        free(pm->sord); pm->sord = NULL;
}

/* Compute minimum (optimistic) cost for moving the given source material */
static double
min_cost(double amt2move, const double *avail, const PRICEMAT *pm, int s)
{
        const short     *srow = psortrow(pm,s);
        const float     *prow = pricerow(pm,s);
        double          total_cost = 0;
        int             j;
                                                /* move cheapest first */
        for (j = 0; (j < pm->ncols) & (amt2move > FTINY); j++) {
                int     d = srow[j];
                double  amt = (amt2move < avail[d]) ? amt2move : avail[d];

                total_cost += amt * prow[d];
                amt2move -= amt;
        }
        return(total_cost);
}

/* Compare entries by moving price */
static int
rmovcmp(void *b, const void *p1, const void *p2)
{
        PRICEMAT        *pm = (PRICEMAT *)b;
        const short     *ij1 = (const short *)p1;
        const short     *ij2 = (const short *)p2;
        float           price_diff;

        if (ij1[1] < 0) return(ij2[1] >= 0);
        if (ij2[1] < 0) return(-1);
        price_diff = pricerow(pm,ij1[0])[ij1[1]] - pricerow(pm,ij2[0])[ij2[1]];
        if (price_diff > 0) return(1);
        if (price_diff < 0) return(-1);
        return(0);
}

/* Take a step in migration by choosing reasonable bucket to transfer */
static double
migration_step(MIGRATION *mig, double *src_rem, double *dst_rem, PRICEMAT *pm)
{
        const int       max2check = 100;
        const double    maxamt = 1./(double)pm->ncols;
        const double    minamt = maxamt*5e-6;
        double          *src_cost;
        short           (*rord)[2];
        struct {
                int     s, d;   /* source and destination */
                double  price;  /* price estimate per amount moved */
                double  amt;    /* amount we can move */
        } cur, best;
        int             r2check, i, ri;
        /*
         * Check cheapest available routes only -- a higher adjusted
         * destination price implies that another source is closer, so
         * we can hold off considering more expensive options until
         * some other (hopefully better) moves have been made.
         */
                                                /* most promising row order */
        rord = (short (*)[2])malloc(sizeof(short)*2*pm->nrows);
        if (rord == NULL)
                goto memerr;
        for (ri = pm->nrows; ri--; ) {
            rord[ri][0] = ri;
            rord[ri][1] = -1;
            if (src_rem[ri] <= minamt)          /* enough source material? */
                    continue;
            for (i = 0; i < pm->ncols; i++)
                if (dst_rem[ rord[ri][1] = psortrow(pm,ri)[i] ] > minamt)
                        break;
            if (i >= pm->ncols) {               /* moved all we can? */
                free(rord);
                return(.0);
            }
        }
        if (pm->nrows > max2check)              /* sort if too many sources */
                qsort_r(rord, pm->nrows, sizeof(short)*2, pm, &rmovcmp);
                                                /* allocate cost array */
        src_cost = (double *)malloc(sizeof(double)*pm->nrows);
        if (src_cost == NULL)
                goto memerr;
        for (i = pm->nrows; i--; )              /* starting costs for diff. */
                src_cost[i] = min_cost(src_rem[i], dst_rem, pm, i);
                                                /* find best source & dest. */
        best.s = best.d = -1; best.price = FHUGE; best.amt = 0;
        if ((r2check = pm->nrows) > max2check)
                r2check = max2check;            /* put a limit on search */
        for (ri = 0; ri < r2check; ri++) {      /* check each source row */
            double      cost_others = 0;
            cur.s = rord[ri][0];
            if ((cur.d = rord[ri][1]) < 0 ||
                        (cur.price = pricerow(pm,cur.s)[cur.d]) >= best.price) {
                if (pm->nrows > max2check) break;       /* sorted end */
                continue;                       /* else skip this one */
            }
            cur.amt = (src_rem[cur.s] < dst_rem[cur.d]) ?
                                src_rem[cur.s] : dst_rem[cur.d];
                                                /* don't just leave smidgen */
            if (cur.amt > maxamt*1.02) cur.amt = maxamt;
            dst_rem[cur.d] -= cur.amt;          /* add up opportunity costs */
            for (i = pm->nrows; i--; )
                if (i != cur.s)
                    cost_others += min_cost(src_rem[i], dst_rem, pm, i)
                                        - src_cost[i];
            dst_rem[cur.d] += cur.amt;          /* undo trial move */
            cur.price += cost_others/cur.amt;   /* adjust effective price */
            if (cur.price < best.price)         /* are we better than best? */
                best = cur;
        }
        free(src_cost);                         /* clean up */
        free(rord);
        if ((best.s < 0) | (best.d < 0))        /* nothing left to move? */
                return(.0);
                                                /* else make the actual move */
        mtx_coef(mig,best.s,best.d) += best.amt;
        src_rem[best.s] -= best.amt;
        dst_rem[best.d] -= best.amt;
        return(best.amt);
memerr:
        fprintf(stderr, "%s: Out of memory in migration_step()\n", progname);
        exit(1);
}

/* Compute and insert migration along directed edge (may fork child) */
static MIGRATION *
create_migration(RBFNODE *from_rbf, RBFNODE *to_rbf)
{
        const double    end_thresh = 5e-6;
        PRICEMAT        pmtx;
        MIGRATION       *newmig;
        double          *src_rem, *dst_rem;
        double          total_rem = 1., move_amt;
        int             i, j;
                                                /* check if exists already */
        for (newmig = from_rbf->ejl; newmig != NULL;
                        newmig = nextedge(from_rbf,newmig))
                if (newmig->rbfv[1] == to_rbf)
                        return(NULL);
                                                /* else allocate */
#ifdef DEBUG
        fprintf(stderr, "Building path from (theta,phi) (%.0f,%.0f) ",
                        get_theta180(from_rbf->invec),
                        get_phi360(from_rbf->invec));
        fprintf(stderr, "to (%.0f,%.0f) with %d x %d matrix\n",
                        get_theta180(to_rbf->invec),
                        get_phi360(to_rbf->invec), 
                        from_rbf->nrbf, to_rbf->nrbf);
#endif
        newmig = new_migration(from_rbf, to_rbf);
        if (run_subprocess())
                return(newmig);                 /* child continues */
        price_routes(&pmtx, from_rbf, to_rbf);
        src_rem = (double *)malloc(sizeof(double)*from_rbf->nrbf);
        dst_rem = (double *)malloc(sizeof(double)*to_rbf->nrbf);
        if ((src_rem == NULL) | (dst_rem == NULL)) {
                fprintf(stderr, "%s: Out of memory in create_migration()\n",
                                progname);
                exit(1);
        }
                                                /* starting quantities */
        memset(newmig->mtx, 0, sizeof(float)*from_rbf->nrbf*to_rbf->nrbf);
        for (i = from_rbf->nrbf; i--; )
                src_rem[i] = rbf_volume(&from_rbf->rbfa[i]) / from_rbf->vtotal;
        for (j = to_rbf->nrbf; j--; )
                dst_rem[j] = rbf_volume(&to_rbf->rbfa[j]) / to_rbf->vtotal;

        do {                                    /* move a bit at a time */
                move_amt = migration_step(newmig, src_rem, dst_rem, &pmtx);
                total_rem -= move_amt;
        } while ((total_rem > end_thresh) & (move_amt > 0));

        for (i = from_rbf->nrbf; i--; ) {       /* normalize final matrix */
            double      nf = rbf_volume(&from_rbf->rbfa[i]);
            if (nf <= FTINY) continue;
            nf = from_rbf->vtotal / nf;
            for (j = to_rbf->nrbf; j--; )
                mtx_coef(newmig,i,j) *= nf;     /* row now sums to 1.0 */
        }
        end_subprocess();                       /* exit here if subprocess */
        free_routes(&pmtx);                     /* free working arrays */
        free(src_rem);
        free(dst_rem);
        return(newmig);
}

/* Check if prospective vertex would create overlapping triangle */
static int
overlaps_tri(const RBFNODE *bv0, const RBFNODE *bv1, const RBFNODE *pv)
{
        const MIGRATION *ej;
        RBFNODE         *vother[2];
        int             im_rev;
                                                /* find shared edge in mesh */
        for (ej = pv->ejl; ej != NULL; ej = nextedge(pv,ej)) {
                const RBFNODE   *tv = opp_rbf(pv,ej);
                if (tv == bv0) {
                        im_rev = is_rev_tri(ej->rbfv[0]->invec,
                                        ej->rbfv[1]->invec, bv1->invec);
                        break;
                }
                if (tv == bv1) {
                        im_rev = is_rev_tri(ej->rbfv[0]->invec,
                                        ej->rbfv[1]->invec, bv0->invec);
                        break;
                }
        }
        if (!get_triangles(vother, ej))         /* triangle on same side? */
                return(0);
        return(vother[im_rev] != NULL);
}

/* Find context hull vertex to complete triangle (oriented call) */
static RBFNODE *
find_chull_vert(const RBFNODE *rbf0, const RBFNODE *rbf1)
{
        FVECT   vmid, vejn, vp;
        RBFNODE *rbf, *rbfbest = NULL;
        double  dprod, area2, bestarea2 = FHUGE, bestdprod = -.5;

        VSUB(vejn, rbf1->invec, rbf0->invec);
        VADD(vmid, rbf0->invec, rbf1->invec);
        if (normalize(vejn) == 0 || normalize(vmid) == 0)
                return(NULL);
                                                /* XXX exhaustive search */
        /* Find triangle with minimum rotation from perpendicular */
        for (rbf = dsf_list; rbf != NULL; rbf = rbf->next) {
                if ((rbf == rbf0) | (rbf == rbf1))
                        continue;
                tri_orient(vp, rbf0->invec, rbf1->invec, rbf->invec);
                if (DOT(vp, vmid) <= FTINY)
                        continue;               /* wrong orientation */
                area2 = .25*DOT(vp,vp);
                VSUB(vp, rbf->invec, rbf0->invec);
                dprod = -DOT(vp, vejn);
                VSUM(vp, vp, vejn, dprod);      /* above guarantees non-zero */
                dprod = DOT(vp, vmid) / VLEN(vp);
                if (dprod <= bestdprod + FTINY*(1 - 2*(area2 < bestarea2)))
                        continue;               /* found better already */
                if (overlaps_tri(rbf0, rbf1, rbf))
                        continue;               /* overlaps another triangle */
                rbfbest = rbf;
                bestdprod = dprod;              /* new one to beat */
                bestarea2 = area2;
        }
        return(rbfbest);
}

/* Create new migration edge and grow mesh recursively around it */
static void
mesh_from_edge(MIGRATION *edge)
{
        MIGRATION       *ej0, *ej1;
        RBFNODE         *tvert[2];
        
        if (edge == NULL)
                return;
                                                /* triangle on either side? */
        get_triangles(tvert, edge);
        if (tvert[0] == NULL) {                 /* grow mesh on right */
                tvert[0] = find_chull_vert(edge->rbfv[0], edge->rbfv[1]);
                if (tvert[0] != NULL) {
                        if (tvert[0]->ord > edge->rbfv[0]->ord)
                                ej0 = create_migration(edge->rbfv[0], tvert[0]);
                        else
                                ej0 = create_migration(tvert[0], edge->rbfv[0]);
                        if (tvert[0]->ord > edge->rbfv[1]->ord)
                                ej1 = create_migration(edge->rbfv[1], tvert[0]);
                        else
                                ej1 = create_migration(tvert[0], edge->rbfv[1]);
                        mesh_from_edge(ej0);
                        mesh_from_edge(ej1);
                }
        } else if (tvert[1] == NULL) {          /* grow mesh on left */
                tvert[1] = find_chull_vert(edge->rbfv[1], edge->rbfv[0]);
                if (tvert[1] != NULL) {
                        if (tvert[1]->ord > edge->rbfv[0]->ord)
                                ej0 = create_migration(edge->rbfv[0], tvert[1]);
                        else
                                ej0 = create_migration(tvert[1], edge->rbfv[0]);
                        if (tvert[1]->ord > edge->rbfv[1]->ord)
                                ej1 = create_migration(edge->rbfv[1], tvert[1]);
                        else
                                ej1 = create_migration(tvert[1], edge->rbfv[1]);
                        mesh_from_edge(ej0);
                        mesh_from_edge(ej1);
                }
        }
}
        
/* Build our triangle mesh from recorded RBFs */
void
build_mesh(void)
{
        double          best2 = M_PI*M_PI;
        RBFNODE         *shrt_edj[2];
        RBFNODE         *rbf0, *rbf1;
                                                /* check if isotropic */
        if (single_plane_incident) {
                for (rbf0 = dsf_list; rbf0 != NULL; rbf0 = rbf0->next)
                        if (rbf0->next != NULL)
                                create_migration(rbf0, rbf0->next);
                await_children(nchild);
                return;
        }
        shrt_edj[0] = shrt_edj[1] = NULL;       /* start w/ shortest edge */
        for (rbf0 = dsf_list; rbf0 != NULL; rbf0 = rbf0->next)
            for (rbf1 = rbf0->next; rbf1 != NULL; rbf1 = rbf1->next) {
                double  dist2 = 2. - 2.*DOT(rbf0->invec,rbf1->invec);
                if (dist2 < best2) {
                        shrt_edj[0] = rbf0;
                        shrt_edj[1] = rbf1;
                        best2 = dist2;
                }
        }
        if (shrt_edj[0] == NULL) {
                fprintf(stderr, "%s: Cannot find shortest edge\n", progname);
                exit(1);
        }
                                                /* build mesh from this edge */
        if (shrt_edj[0]->ord < shrt_edj[1]->ord)
                mesh_from_edge(create_migration(shrt_edj[0], shrt_edj[1]));
        else
                mesh_from_edge(create_migration(shrt_edj[1], shrt_edj[0]));
                                                /* complete migrations */
        await_children(nchild);
}
Revision:	2.11
Committed:	Thu Oct 24 16:11:37 2013 UTC (10 years, 5 months ago) by greg
Content type:	text/plain
Branch:	MAIN
Changes since 2.10:	+74 -34 lines
Log Message:	Sped up convergence on large systems by almost 3x
#	Content
1	#ifndef lint
2	static const char RCSid[] = "$Id: bsdfmesh.c,v 2.10 2013/09/26 14:57:18 greg Exp $";
3	#endif
4	/*
5	* Create BSDF advection mesh from radial basis functions.
6	*
7	* G. Ward
8	*/
9
10	#ifndef _WIN32
11	#include <unistd.h>
12	#include <sys/wait.h>
13	#include <sys/mman.h>
14	#endif
15	#define _USE_MATH_DEFINES
16	#include <stdio.h>
17	#include <stdlib.h>
18	#include <string.h>
19	#include <math.h>
20	#include "bsdfrep.h"
21	/* number of processes to run */
22	int nprocs = 1;
23	/* number of children (-1 in child) */
24	static int nchild = 0;
25
26	typedef struct {
27	int nrows, ncols; /* array size (matches migration) */
28	float price; / migration prices */
29	short sord; / sort for each row, low to high */
30	float prow; / current price row */
31	} PRICEMAT; /* sorted pricing matrix */
32
33	#define pricerow(p,i) ((p)->price + (i)*(p)->ncols)
34	#define psortrow(p,i) ((p)->sord + (i)*(p)->ncols)
35
36	/* Create a new migration holder (sharing memory for multiprocessing) */
37	static MIGRATION *
38	new_migration(RBFNODE from_rbf, RBFNODE to_rbf)
39	{
40	size_t memlen = sizeof(MIGRATION) +
41	sizeof(float)(from_rbf->nrbfto_rbf->nrbf - 1);
42	MIGRATION *newmig;
43	#ifdef _WIN32
44	if (nprocs > 1)
45	fprintf(stderr, "%s: warning - multiprocessing not supported\n",
46	progname);
47	nprocs = 1;
48	newmig = (MIGRATION *)malloc(memlen);
49	#else
50	if (nprocs <= 1) { /* single process? */
51	newmig = (MIGRATION *)malloc(memlen);
52	} else { /* else need to share memory */
53	newmig = (MIGRATION *)mmap(NULL, memlen, PROT_READ\|PROT_WRITE,
54	MAP_ANON\|MAP_SHARED, -1, 0);
55	if ((void *)newmig == MAP_FAILED)
56	newmig = NULL;
57	}
58	#endif
59	if (newmig == NULL) {
60	fprintf(stderr, "%s: cannot allocate new migration\n", progname);
61	exit(1);
62	}
63	newmig->rbfv[0] = from_rbf;
64	newmig->rbfv[1] = to_rbf;
65	/* insert in edge lists */
66	newmig->enxt[0] = from_rbf->ejl;
67	from_rbf->ejl = newmig;
68	newmig->enxt[1] = to_rbf->ejl;
69	to_rbf->ejl = newmig;
70	newmig->next = mig_list; /* push onto global list */
71	return(mig_list = newmig);
72	}
73
74	#ifdef _WIN32
75	#define await_children(n) (void)(n)
76	#define run_subprocess() 0
77	#define end_subprocess() (void)0
78	#else
79
80	/* Wait for the specified number of child processes to complete */
81	static void
82	await_children(int n)
83	{
84	int exit_status = 0;
85
86	if (n > nchild)
87	n = nchild;
88	while (n-- > 0) {
89	int status;
90	if (wait(&status) < 0) {
91	fprintf(stderr, "%s: missing child(ren)!\n", progname);
92	nchild = 0;
93	break;
94	}
95	--nchild;
96	if (status) { /* something wrong */
97	if ((status = WEXITSTATUS(status)))
98	exit_status = status;
99	else
100	exit_status += !exit_status;
101	fprintf(stderr, "%s: subprocess died\n", progname);
102	n = nchild; /* wait for the rest */
103	}
104	}
105	if (exit_status)
106	exit(exit_status);
107	}
108
109	/* Start child process if multiprocessing selected */
110	static pid_t
111	run_subprocess(void)
112	{
113	int status;
114	pid_t pid;
115
116	if (nprocs <= 1) /* any children requested? */
117	return(0);
118	await_children(nchild + 1 - nprocs); /* free up child process */
119	if ((pid = fork())) {
120	if (pid < 0) {
121	fprintf(stderr, "%s: cannot fork subprocess\n",
122	progname);
123	await_children(nchild);
124	exit(1);
125	}
126	++nchild; /* subprocess started */
127	return(pid);
128	}
129	nchild = -1;
130	return(0); /* put child to work */
131	}
132
133	/* If we are in subprocess, call exit */
134	#define end_subprocess() if (nchild < 0) _exit(0); else
135
136	#endif /* ! _WIN32 */
137
138	/* Comparison routine needed for sorting price row */
139	static int
140	msrt_cmp(void b, const void p1, const void *p2)
141	{
142	PRICEMAT pm = (PRICEMAT )b;
143	float c1 = pm->prow[(const short )p1];
144	float c2 = pm->prow[(const short )p2];
145
146	if (c1 > c2) return(1);
147	if (c1 < c2) return(-1);
148	return(0);
149	}
150
151	/* Compute (and allocate) migration price matrix for optimization */
152	static void
153	price_routes(PRICEMAT pm, const RBFNODE from_rbf, const RBFNODE *to_rbf)
154	{
155	FVECT vto = (FVECT )malloc(sizeof(FVECT) * to_rbf->nrbf);
156	int i, j;
157
158	pm->nrows = from_rbf->nrbf;
159	pm->ncols = to_rbf->nrbf;
160	pm->price = (float )malloc(sizeof(float) pm->nrows*pm->ncols);
161	pm->sord = (short )malloc(sizeof(short) pm->nrows*pm->ncols);
162
163	if ((pm->price == NULL) \| (pm->sord == NULL) \| (vto == NULL)) {
164	fprintf(stderr, "%s: Out of memory in migration_costs()\n",
165	progname);
166	exit(1);
167	}
168	for (j = to_rbf->nrbf; j--; ) /* save repetitive ops. */
169	ovec_from_pos(vto[j], to_rbf->rbfa[j].gx, to_rbf->rbfa[j].gy);
170
171	for (i = from_rbf->nrbf; i--; ) {
172	const double from_ang = R2ANG(from_rbf->rbfa[i].crad);
173	FVECT vfrom;
174	short *srow;
175	ovec_from_pos(vfrom, from_rbf->rbfa[i].gx, from_rbf->rbfa[i].gy);
176	pm->prow = pricerow(pm,i);
177	srow = psortrow(pm,i);
178	for (j = to_rbf->nrbf; j--; ) {
179	double dprod = DOT(vfrom, vto[j]);
180	pm->prow[j] = ((dprod >= 1.) ? .0 : acos(dprod)) +
181	fabs(R2ANG(to_rbf->rbfa[j].crad) - from_ang);
182	srow[j] = j;
183	}
184	qsort_r(srow, pm->ncols, sizeof(short), pm, &msrt_cmp);
185	}
186	free(vto);
187	}
188
189	/* Free price matrix */
190	static void
191	free_routes(PRICEMAT *pm)
192	{
193	free(pm->price); pm->price = NULL;
194	free(pm->sord); pm->sord = NULL;
195	}
196
197	/* Compute minimum (optimistic) cost for moving the given source material */
198	static double
199	min_cost(double amt2move, const double avail, const PRICEMAT pm, int s)
200	{
201	const short *srow = psortrow(pm,s);
202	const float *prow = pricerow(pm,s);
203	double total_cost = 0;
204	int j;
205	/* move cheapest first */
206	for (j = 0; (j < pm->ncols) & (amt2move > FTINY); j++) {
207	int d = srow[j];
208	double amt = (amt2move < avail[d]) ? amt2move : avail[d];
209
210	total_cost += amt * prow[d];
211	amt2move -= amt;
212	}
213	return(total_cost);
214	}
215
216	/* Compare entries by moving price */
217	static int
218	rmovcmp(void b, const void p1, const void *p2)
219	{
220	PRICEMAT pm = (PRICEMAT )b;
221	const short ij1 = (const short )p1;
222	const short ij2 = (const short )p2;
223	float price_diff;
224
225	if (ij1[1] < 0) return(ij2[1] >= 0);
226	if (ij2[1] < 0) return(-1);
227	price_diff = pricerow(pm,ij1[0])[ij1[1]] - pricerow(pm,ij2[0])[ij2[1]];
228	if (price_diff > 0) return(1);
229	if (price_diff < 0) return(-1);
230	return(0);
231	}
232
233	/* Take a step in migration by choosing reasonable bucket to transfer */
234	static double
235	migration_step(MIGRATION mig, double src_rem, double dst_rem, PRICEMAT pm)
236	{
237	const int max2check = 100;
238	const double maxamt = 1./(double)pm->ncols;
239	const double minamt = maxamt*5e-6;
240	double *src_cost;
241	short (*rord)[2];
242	struct {
243	int s, d; /* source and destination */
244	double price; /* price estimate per amount moved */
245	double amt; /* amount we can move */
246	} cur, best;
247	int r2check, i, ri;
248	/*
249	* Check cheapest available routes only -- a higher adjusted
250	* destination price implies that another source is closer, so
251	* we can hold off considering more expensive options until
252	* some other (hopefully better) moves have been made.
253	*/
254	/* most promising row order */
255	rord = (short ()[2])malloc(sizeof(short)2*pm->nrows);
256	if (rord == NULL)
257	goto memerr;
258	for (ri = pm->nrows; ri--; ) {
259	rord[ri][0] = ri;
260	rord[ri][1] = -1;
261	if (src_rem[ri] <= minamt) /* enough source material? */
262	continue;
263	for (i = 0; i < pm->ncols; i++)
264	if (dst_rem[ rord[ri][1] = psortrow(pm,ri)[i] ] > minamt)
265	break;
266	if (i >= pm->ncols) { /* moved all we can? */
267	free(rord);
268	return(.0);
269	}
270	}
271	if (pm->nrows > max2check) /* sort if too many sources */
272	qsort_r(rord, pm->nrows, sizeof(short)*2, pm, &rmovcmp);
273	/* allocate cost array */
274	src_cost = (double )malloc(sizeof(double)pm->nrows);
275	if (src_cost == NULL)
276	goto memerr;
277	for (i = pm->nrows; i--; ) /* starting costs for diff. */
278	src_cost[i] = min_cost(src_rem[i], dst_rem, pm, i);
279	/* find best source & dest. */
280	best.s = best.d = -1; best.price = FHUGE; best.amt = 0;
281	if ((r2check = pm->nrows) > max2check)
282	r2check = max2check; /* put a limit on search */
283	for (ri = 0; ri < r2check; ri++) { /* check each source row */
284	double cost_others = 0;
285	cur.s = rord[ri][0];
286	if ((cur.d = rord[ri][1]) < 0 \|\|
287	(cur.price = pricerow(pm,cur.s)[cur.d]) >= best.price) {
288	if (pm->nrows > max2check) break; /* sorted end */
289	continue; /* else skip this one */
290	}
291	cur.amt = (src_rem[cur.s] < dst_rem[cur.d]) ?
292	src_rem[cur.s] : dst_rem[cur.d];
293	/* don't just leave smidgen */
294	if (cur.amt > maxamt*1.02) cur.amt = maxamt;
295	dst_rem[cur.d] -= cur.amt; /* add up opportunity costs */
296	for (i = pm->nrows; i--; )
297	if (i != cur.s)
298	cost_others += min_cost(src_rem[i], dst_rem, pm, i)
299	- src_cost[i];
300	dst_rem[cur.d] += cur.amt; /* undo trial move */
301	cur.price += cost_others/cur.amt; /* adjust effective price */
302	if (cur.price < best.price) /* are we better than best? */
303	best = cur;
304	}
305	free(src_cost); /* clean up */
306	free(rord);
307	if ((best.s < 0) \| (best.d < 0)) /* nothing left to move? */
308	return(.0);
309	/* else make the actual move */
310	mtx_coef(mig,best.s,best.d) += best.amt;
311	src_rem[best.s] -= best.amt;
312	dst_rem[best.d] -= best.amt;
313	return(best.amt);
314	memerr:
315	fprintf(stderr, "%s: Out of memory in migration_step()\n", progname);
316	exit(1);
317	}
318
319	/* Compute and insert migration along directed edge (may fork child) */
320	static MIGRATION *
321	create_migration(RBFNODE from_rbf, RBFNODE to_rbf)
322	{
323	const double end_thresh = 5e-6;
324	PRICEMAT pmtx;
325	MIGRATION *newmig;
326	double src_rem, dst_rem;
327	double total_rem = 1., move_amt;
328	int i, j;
329	/* check if exists already */
330	for (newmig = from_rbf->ejl; newmig != NULL;
331	newmig = nextedge(from_rbf,newmig))
332	if (newmig->rbfv[1] == to_rbf)
333	return(NULL);
334	/* else allocate */
335	#ifdef DEBUG
336	fprintf(stderr, "Building path from (theta,phi) (%.0f,%.0f) ",
337	get_theta180(from_rbf->invec),
338	get_phi360(from_rbf->invec));
339	fprintf(stderr, "to (%.0f,%.0f) with %d x %d matrix\n",
340	get_theta180(to_rbf->invec),
341	get_phi360(to_rbf->invec),
342	from_rbf->nrbf, to_rbf->nrbf);
343	#endif
344	newmig = new_migration(from_rbf, to_rbf);
345	if (run_subprocess())
346	return(newmig); /* child continues */
347	price_routes(&pmtx, from_rbf, to_rbf);
348	src_rem = (double )malloc(sizeof(double)from_rbf->nrbf);
349	dst_rem = (double )malloc(sizeof(double)to_rbf->nrbf);
350	if ((src_rem == NULL) \| (dst_rem == NULL)) {
351	fprintf(stderr, "%s: Out of memory in create_migration()\n",
352	progname);
353	exit(1);
354	}
355	/* starting quantities */
356	memset(newmig->mtx, 0, sizeof(float)from_rbf->nrbfto_rbf->nrbf);
357	for (i = from_rbf->nrbf; i--; )
358	src_rem[i] = rbf_volume(&from_rbf->rbfa[i]) / from_rbf->vtotal;
359	for (j = to_rbf->nrbf; j--; )
360	dst_rem[j] = rbf_volume(&to_rbf->rbfa[j]) / to_rbf->vtotal;
361
362	do { /* move a bit at a time */
363	move_amt = migration_step(newmig, src_rem, dst_rem, &pmtx);
364	total_rem -= move_amt;
365	} while ((total_rem > end_thresh) & (move_amt > 0));
366
367	for (i = from_rbf->nrbf; i--; ) { /* normalize final matrix */
368	double nf = rbf_volume(&from_rbf->rbfa[i]);
369	if (nf <= FTINY) continue;
370	nf = from_rbf->vtotal / nf;
371	for (j = to_rbf->nrbf; j--; )
372	mtx_coef(newmig,i,j) = nf; / row now sums to 1.0 */
373	}
374	end_subprocess(); /* exit here if subprocess */
375	free_routes(&pmtx); /* free working arrays */
376	free(src_rem);
377	free(dst_rem);
378	return(newmig);
379	}
380
381	/* Check if prospective vertex would create overlapping triangle */
382	static int
383	overlaps_tri(const RBFNODE bv0, const RBFNODE bv1, const RBFNODE *pv)
384	{
385	const MIGRATION *ej;
386	RBFNODE *vother[2];
387	int im_rev;
388	/* find shared edge in mesh */
389	for (ej = pv->ejl; ej != NULL; ej = nextedge(pv,ej)) {
390	const RBFNODE *tv = opp_rbf(pv,ej);
391	if (tv == bv0) {
392	im_rev = is_rev_tri(ej->rbfv[0]->invec,
393	ej->rbfv[1]->invec, bv1->invec);
394	break;
395	}
396	if (tv == bv1) {
397	im_rev = is_rev_tri(ej->rbfv[0]->invec,
398	ej->rbfv[1]->invec, bv0->invec);
399	break;
400	}
401	}
402	if (!get_triangles(vother, ej)) /* triangle on same side? */
403	return(0);
404	return(vother[im_rev] != NULL);
405	}
406
407	/* Find context hull vertex to complete triangle (oriented call) */
408	static RBFNODE *
409	find_chull_vert(const RBFNODE rbf0, const RBFNODE rbf1)
410	{
411	FVECT vmid, vejn, vp;
412	RBFNODE rbf, rbfbest = NULL;
413	double dprod, area2, bestarea2 = FHUGE, bestdprod = -.5;
414
415	VSUB(vejn, rbf1->invec, rbf0->invec);
416	VADD(vmid, rbf0->invec, rbf1->invec);
417	if (normalize(vejn) == 0 \|\| normalize(vmid) == 0)
418	return(NULL);
419	/* XXX exhaustive search */
420	/* Find triangle with minimum rotation from perpendicular */
421	for (rbf = dsf_list; rbf != NULL; rbf = rbf->next) {
422	if ((rbf == rbf0) \| (rbf == rbf1))
423	continue;
424	tri_orient(vp, rbf0->invec, rbf1->invec, rbf->invec);
425	if (DOT(vp, vmid) <= FTINY)
426	continue; /* wrong orientation */
427	area2 = .25*DOT(vp,vp);
428	VSUB(vp, rbf->invec, rbf0->invec);
429	dprod = -DOT(vp, vejn);
430	VSUM(vp, vp, vejn, dprod); /* above guarantees non-zero */
431	dprod = DOT(vp, vmid) / VLEN(vp);
432	if (dprod <= bestdprod + FTINY(1 - 2(area2 < bestarea2)))
433	continue; /* found better already */
434	if (overlaps_tri(rbf0, rbf1, rbf))
435	continue; /* overlaps another triangle */
436	rbfbest = rbf;
437	bestdprod = dprod; /* new one to beat */
438	bestarea2 = area2;
439	}
440	return(rbfbest);
441	}
442
443	/* Create new migration edge and grow mesh recursively around it */
444	static void
445	mesh_from_edge(MIGRATION *edge)
446	{
447	MIGRATION ej0, ej1;
448	RBFNODE *tvert[2];
449
450	if (edge == NULL)
451	return;
452	/* triangle on either side? */
453	get_triangles(tvert, edge);
454	if (tvert[0] == NULL) { /* grow mesh on right */
455	tvert[0] = find_chull_vert(edge->rbfv[0], edge->rbfv[1]);
456	if (tvert[0] != NULL) {
457	if (tvert[0]->ord > edge->rbfv[0]->ord)
458	ej0 = create_migration(edge->rbfv[0], tvert[0]);
459	else
460	ej0 = create_migration(tvert[0], edge->rbfv[0]);
461	if (tvert[0]->ord > edge->rbfv[1]->ord)
462	ej1 = create_migration(edge->rbfv[1], tvert[0]);
463	else
464	ej1 = create_migration(tvert[0], edge->rbfv[1]);
465	mesh_from_edge(ej0);
466	mesh_from_edge(ej1);
467	}
468	} else if (tvert[1] == NULL) { /* grow mesh on left */
469	tvert[1] = find_chull_vert(edge->rbfv[1], edge->rbfv[0]);
470	if (tvert[1] != NULL) {
471	if (tvert[1]->ord > edge->rbfv[0]->ord)
472	ej0 = create_migration(edge->rbfv[0], tvert[1]);
473	else
474	ej0 = create_migration(tvert[1], edge->rbfv[0]);
475	if (tvert[1]->ord > edge->rbfv[1]->ord)
476	ej1 = create_migration(edge->rbfv[1], tvert[1]);
477	else
478	ej1 = create_migration(tvert[1], edge->rbfv[1]);
479	mesh_from_edge(ej0);
480	mesh_from_edge(ej1);
481	}
482	}
483	}
484
485	/* Build our triangle mesh from recorded RBFs */
486	void
487	build_mesh(void)
488	{
489	double best2 = M_PI*M_PI;
490	RBFNODE *shrt_edj[2];
491	RBFNODE rbf0, rbf1;
492	/* check if isotropic */
493	if (single_plane_incident) {
494	for (rbf0 = dsf_list; rbf0 != NULL; rbf0 = rbf0->next)
495	if (rbf0->next != NULL)
496	create_migration(rbf0, rbf0->next);
497	await_children(nchild);
498	return;
499	}
500	shrt_edj[0] = shrt_edj[1] = NULL; /* start w/ shortest edge */
501	for (rbf0 = dsf_list; rbf0 != NULL; rbf0 = rbf0->next)
502	for (rbf1 = rbf0->next; rbf1 != NULL; rbf1 = rbf1->next) {
503	double dist2 = 2. - 2.*DOT(rbf0->invec,rbf1->invec);
504	if (dist2 < best2) {
505	shrt_edj[0] = rbf0;
506	shrt_edj[1] = rbf1;
507	best2 = dist2;
508	}
509	}
510	if (shrt_edj[0] == NULL) {
511	fprintf(stderr, "%s: Cannot find shortest edge\n", progname);
512	exit(1);
513	}
514	/* build mesh from this edge */
515	if (shrt_edj[0]->ord < shrt_edj[1]->ord)
516	mesh_from_edge(create_migration(shrt_edj[0], shrt_edj[1]));
517	else
518	mesh_from_edge(create_migration(shrt_edj[1], shrt_edj[0]));
519	/* complete migrations */
520	await_children(nchild);
521	}