[ViewVC] Diff of: Development/ray/src/rt/ambcomp.c

Comparing ray/src/rt/ambcomp.c (file contents):
Revision 2.28 by greg, Sat Apr 19 19:20:47 2014 UTC vs.
Revision 2.54 by greg, Fri May 9 04:55:19 2014 UTC

+ *      for Irradiance Caching" by Schwarzhaupt, Wann Jensen, & Jarosz
+ *      from ACM SIGGRAPH Asia 2012 conference proceedings.
-+
+ *  Added book-keeping optimization to avoid calculations that would
-+
+ *      cancel due to traversal both directions on edges that are adjacent
-+
+ *      to same-valued triangles.  This cuts about half of Hessian math.
-+
+ *
+ *  Declarations of external symbols in ambient.h
+ */
+extern void             SDsquare2disk(double ds[2], double seedx, double seedy);
-+
+                                /* vertex direction bit positions */
-+
+#define VDB_xy  0
-+
+#define VDB_y   01
-+
+#define VDB_x   02
-+
+#define VDB_Xy  03
-+
+#define VDB_xY  04
-+
+#define VDB_X   05
-+
+#define VDB_Y   06
-+
+#define VDB_XY  07
-+
+                                /* get opposite vertex direction bit */
-+
+#define VDB_OPP(f)      (~(f) & 07)
-+
+                                /* adjacent triangle vertex flags */
-+
+static const int  adjacent_trifl[8] = {
-+
+,                      /* forbidden diagonal */
-+
+<<VDB_x|1<<VDB_y|1<<VDB_Xy,
-+
+<<VDB_y|1<<VDB_x|1<<VDB_xY,
-+
+<<VDB_y|1<<VDB_Xy|1<<VDB_X,
-+
+<<VDB_x|1<<VDB_xY|1<<VDB_Y,
-+
+<<VDB_Xy|1<<VDB_X|1<<VDB_Y,
-+
+<<VDB_xY|1<<VDB_Y|1<<VDB_X,
-+
+,                      /* forbidden diagonal */
-+
+                };
-+
+typedef struct {
-+
+        COLOR   v;              /* hemisphere sample value */
-+
+        float   d;              /* reciprocal distance (1/rt) */
-+
+        FVECT   p;              /* intersection point */
-+
+} AMBSAMP;              /* sample value */
-+
-+
+typedef struct {
+        RAY     *rp;            /* originating ray sample */
+        FVECT   ux, uy;         /* tangent axis unit vectors */
+        int     ns;             /* number of samples per axis */
+        COLOR   acoef;          /* division contribution coefficient */
-<
+        struct s_ambsamp {
-<
+                COLOR   v;              /* hemisphere sample value */
-<
+                float   p[3];           /* intersection point */
-<
+        } sa[1];                /* sample array (extends struct) */
->
+        AMBSAMP sa[1];          /* sample array (extends struct) */
+}  AMBHEMI;             /* ambient sample hemisphere */
-<
+#define ambsamp(h,i,j)  (h)->sa[(i)*(h)->ns + (j)]
->
+#define ambndx(h,i,j)   ((i)*(h)->ns + (j))
->
+#define ambsam(h,i,j)   (h)->sa[ambndx(h,i,j)]
+typedef struct {
-<
+        FVECT   r_i, r_i1, e_i;
-<
+        double  nf, I1, I2, J2;
->
+        FVECT   r_i, r_i1, e_i, rcp, rI2_eJ2;
->
+        double  I1, I2;
->
+        int     valid;
+} FFTRI;                /* vectors and coefficients for Hessian calculation */
-+
+/* Get index for adjacent vertex */
-+
+static int
-+
+adjacent_verti(AMBHEMI *hp, int i, int j, int dbit)
-+
+{
-+
+        int     i0 = i*hp->ns + j;
-+
-+
+        switch (dbit) {
-+
+        case VDB_y:     return(i0 - hp->ns);
-+
+        case VDB_x:     return(i0 - 1);
-+
+        case VDB_Xy:    return(i0 - hp->ns + 1);
-+
+        case VDB_xY:    return(i0 + hp->ns - 1);
-+
+        case VDB_X:     return(i0 + 1);
-+
+        case VDB_Y:     return(i0 + hp->ns);
-+
+                                /* the following should never occur */
-+
+        case VDB_xy:    return(i0 - hp->ns - 1);
-+
+        case VDB_XY:    return(i0 + hp->ns + 1);
-+
+        }
-+
+        return(-1);
-+
+}
-+
-+
-+
+/* Get vertex direction bit for the opposite edge to complete triangle */
-+
+static int
-+
+vdb_edge(int db1, int db2)
-+
+{
-+
+        switch (db1) {
-+
+        case VDB_x:     return(db2==VDB_y ? VDB_Xy : VDB_Y);
-+
+        case VDB_y:     return(db2==VDB_x ? VDB_xY : VDB_X);
-+
+        case VDB_X:     return(db2==VDB_Xy ? VDB_y : VDB_xY);
-+
+        case VDB_Y:     return(db2==VDB_xY ? VDB_x : VDB_Xy);
-+
+        case VDB_xY:    return(db2==VDB_x ? VDB_y : VDB_X);
-+
+        case VDB_Xy:    return(db2==VDB_y ? VDB_x : VDB_Y);
-+
+        }
-+
+        error(CONSISTENCY, "forbidden diagonal in vdb_edge()");
-+
+        return(-1);
-+
+}
-+
-+
+static AMBHEMI *
+inithemi(                       /* initialize sampling hemisphere */
+        COLOR   ac,
+        if (n < i)
+                n = i;
+                                        /* allocate sampling array */
-<
+        hp = (AMBHEMI *)malloc(sizeof(AMBHEMI) +
-<
+                                sizeof(struct s_ambsamp)*(n*n - 1));
->
+        hp = (AMBHEMI *)malloc(sizeof(AMBHEMI) + sizeof(AMBSAMP)*(n*n - 1));
+        if (hp == NULL)
+                return(NULL);
+        hp->rp = r;
+        d = 1.0/(n*n);
+        scalecolor(hp->acoef, d);
+                                        /* make tangent plane axes */
-<
+        hp->uy[0] = 0.1 - 0.2*frandom();
-<
+        hp->uy[1] = 0.1 - 0.2*frandom();
-<
+        hp->uy[2] = 0.1 - 0.2*frandom();
-<
+        for (i = 0; i < 3; i++)
-<
+                if (r->ron[i] < 0.6 && r->ron[i] > -0.6)
->
+        hp->uy[0] = 0.5 - frandom();
->
+        hp->uy[1] = 0.5 - frandom();
->
+        hp->uy[2] = 0.5 - frandom();
->
+        for (i = 3; i--; )
->
+                if ((-0.6 < r->ron[i]) & (r->ron[i] < 0.6))
+                        break;
-<
+        if (i >= 3)
-<
+                error(CONSISTENCY, "bad ray direction in inithemi()");
->
+        if (i < 0)
->
+                error(CONSISTENCY, "bad ray direction in inithemi");
+        hp->uy[i] = 1.0;
+        VCROSS(hp->ux, hp->uy, r->ron);
+        normalize(hp->ux);
-<
+static struct s_ambsamp *
-<
+ambsample(                              /* sample an ambient direction */
-<
+        AMBHEMI *hp,
-<
+        int     i,
-<
+        int     j
-<
+)
->
+/* Sample ambient division and apply weighting coefficient */
->
+static int
->
+getambsamp(RAY *arp, AMBHEMI *hp, int i, int j, int n)
-<
+        struct s_ambsamp        *ap = &ambsamp(hp,i,j);
-<
+        RAY                     ar;
-<
+        int                     hlist[3];
-<
+        double                  spt[2], zd;
-<
+        int                     ii;
->
+        int     hlist[3], ii;
->
+        double  spt[2], zd;
+                                        /* ambient coefficient for weight */
+        if (ambacc > FTINY)
-<
+                setcolor(ar.rcoef, AVGREFL, AVGREFL, AVGREFL);
->
+                setcolor(arp->rcoef, AVGREFL, AVGREFL, AVGREFL);
+        else
-<
+                copycolor(ar.rcoef, hp->acoef);
-<
+        if (rayorigin(&ar, AMBIENT, hp->rp, ar.rcoef) < 0) {
-<
+                setcolor(ap->v, 0., 0., 0.);
-<
+                VCOPY(ap->p, hp->rp->rop);
-<
+                return(NULL);           /* no sample taken */
-<
+        }
->
+                copycolor(arp->rcoef, hp->acoef);
->
+        if (rayorigin(arp, AMBIENT, hp->rp, arp->rcoef) < 0)
->
+                return(0);
+        if (ambacc > FTINY) {
-<
+                multcolor(ar.rcoef, hp->acoef);
-<
+                scalecolor(ar.rcoef, 1./AVGREFL);
->
+                multcolor(arp->rcoef, hp->acoef);
->
+                scalecolor(arp->rcoef, 1./AVGREFL);
-<
+                                        /* generate hemispherical sample */
-<
+        SDsquare2disk(spt,      (i+.1+.8*frandom())/hp->ns,
-<
+                                (j+.1+.8*frandom())/hp->ns );
->
+        hlist[0] = hp->rp->rno;
->
+        hlist[1] = j;
->
+        hlist[2] = i;
->
+        multisamp(spt, 2, urand(ilhash(hlist,3)+n));
->
+        if (!n) {                       /* avoid border samples for n==0 */
->
+                if ((spt[0] < 0.1) | (spt[0] >= 0.9))
->
+                        spt[0] = 0.1 + 0.8*frandom();
->
+                if ((spt[1] < 0.1) | (spt[1] >= 0.9))
->
+                        spt[1] = 0.1 + 0.8*frandom();
->
+        }
->
+        SDsquare2disk(spt, (j+spt[1])/hp->ns, (i+spt[0])/hp->ns);
+        zd = sqrt(1. - spt[0]*spt[0] - spt[1]*spt[1]);
+        for (ii = 3; ii--; )
-<
+                ar.rdir[ii] =   spt[0]*hp->ux[ii] +
->
+                arp->rdir[ii] = spt[0]*hp->ux[ii] +
+                                spt[1]*hp->uy[ii] +
+                                zd*hp->rp->ron[ii];
-<
+        checknorm(ar.rdir);
-<
+        dimlist[ndims++] = i*hp->ns + j + 90171;
-<
+        rayvalue(&ar);                  /* evaluate ray */
-<
+        ndims--;
-<
+        multcolor(ar.rcol, ar.rcoef);   /* apply coefficient */
-<
+        copycolor(ap->v, ar.rcol);
-<
+        if (ar.rt > 20.0*maxarad)       /* limit vertex distance */
-<
+                ar.rt = 20.0*maxarad;
->
+        checknorm(arp->rdir);
->
+        dimlist[ndims++] = ambndx(hp,i,j) + 90171;
->
+        rayvalue(arp);                  /* evaluate ray */
->
+        ndims--;                        /* apply coefficient */
->
+        multcolor(arp->rcol, arp->rcoef);
->
+        return(1);
->
+}
->
->
->
+static AMBSAMP *
->
+ambsample(                              /* initial ambient division sample */
->
+        AMBHEMI *hp,
->
+        int     i,
->
+        int     j
->
+)
->
+{
->
+        AMBSAMP *ap = &ambsam(hp,i,j);
->
+        RAY     ar;
->
+                                        /* generate hemispherical sample */
->
+        if (!getambsamp(&ar, hp, i, j, 0) || ar.rt <= FTINY) {
->
+                memset(ap, 0, sizeof(AMBSAMP));
->
+                return(NULL);
->
+        }
->
+        ap->d = 1.0/ar.rt;              /* limit vertex distance */
->
+        if (ar.rt > 10.0*thescene.cusize)
->
+                ar.rt = 10.0*thescene.cusize;
+        VSUM(ap->p, ar.rorg, ar.rdir, ar.rt);
-+
+        copycolor(ap->v, ar.rcol);
+        return(ap);
-+
+/* Estimate errors based on ambient division differences */
-+
+static float *
-+
+getambdiffs(AMBHEMI *hp)
-+
+{
-+
+        float   *earr = (float *)malloc(sizeof(float)*hp->ns*hp->ns);
-+
+        float   *ep;
-+
+        AMBSAMP *ap;
-+
+        double  b, d2;
-+
+        int     i, j;
-+
-+
+        if (earr == NULL)               /* out of memory? */
-+
+                return(NULL);
-+
+                                        /* compute squared neighbor diffs */
-+
+        for (ap = hp->sa, ep = earr, i = 0; i < hp->ns; i++)
-+
+            for (j = 0; j < hp->ns; j++, ap++, ep++) {
-+
+                ep[0] = FTINY;
-+
+                b = bright(ap[0].v);
-+
+                if (i) {                /* from above */
-+
+                        d2 = b - bright(ap[-hp->ns].v);
-+
+                        d2 *= d2;
-+
+                        ep[0] += d2;
-+
+                        ep[-hp->ns] += d2;
-+
+                }
-+
+                if (j) {                /* from behind */
-+
+                        d2 = b - bright(ap[-1].v);
-+
+                        d2 *= d2;
-+
+                        ep[0] += d2;
-+
+                        ep[-1] += d2;
-+
+                }
-+
+            }
-+
+                                        /* correct for number of neighbors */
-+
+        earr[0] *= 2.f;
-+
+        earr[hp->ns-1] *= 2.f;
-+
+        earr[(hp->ns-1)*hp->ns] *= 2.f;
-+
+        earr[(hp->ns-1)*hp->ns + hp->ns-1] *= 2.f;
-+
+        for (i = 1; i < hp->ns-1; i++) {
-+
+                earr[i*hp->ns] *= 4./3.;
-+
+                earr[i*hp->ns + hp->ns-1] *= 4./3.;
-+
+        }
-+
+        for (j = 1; j < hp->ns-1; j++) {
-+
+                earr[j] *= 4./3.;
-+
+                earr[(hp->ns-1)*hp->ns + j] *= 4./3.;
-+
+        }
-+
+        return(earr);
-+
+}
-+
-+
-+
+/* Perform super-sampling on hemisphere (introduces bias) */
-+
+static void
-+
+ambsupersamp(double acol[3], AMBHEMI *hp, int cnt)
-+
+{
-+
+        float   *earr = getambdiffs(hp);
-+
+        double  e2rem = 0;
-+
+        AMBSAMP *ap;
-+
+        RAY     ar;
-+
+        double  asum[3];
-+
+        float   *ep;
-+
+        int     i, j, n;
-+
-+
+        if (earr == NULL)               /* just skip calc. if no memory */
-+
+                return;
-+
+                                        /* accumulate estimated variances */
-+
+        for (ep = earr + hp->ns*hp->ns; ep-- > earr; )
-+
+                e2rem += *ep;
-+
+        ep = earr;                      /* perform super-sampling */
-+
+        for (ap = hp->sa, i = 0; i < hp->ns; i++)
-+
+            for (j = 0; j < hp->ns; j++, ap++) {
-+
+                int     nss = *ep/e2rem*cnt + frandom();
-+
+                asum[0] = asum[1] = asum[2] = 0.0;
-+
+                for (n = 1; n <= nss; n++) {
-+
+                        if (!getambsamp(&ar, hp, i, j, n)) {
-+
+                                nss = n-1;
-+
+                                break;
-+
+                        }
-+
+                        addcolor(asum, ar.rcol);
-+
+                }
-+
+                if (nss) {              /* update returned ambient value */
-+
+                        const double    ssf = 1./(nss + 1.);
-+
+                        for (n = 3; n--; )
-+
+                                acol[n] += ssf*asum[n] +
-+
+                                                (ssf - 1.)*colval(ap->v,n);
-+
+                }
-+
+                e2rem -= *ep++;         /* update remainders */
-+
+                cnt -= nss;
-+
+        }
-+
+        free(earr);
-+
+}
-+
-+
-+
+/* Compute vertex flags, indicating farthest in each direction */
-+
+static uby8 *
-+
+vertex_flags(AMBHEMI *hp)
-+
+{
-+
+        uby8    *vflags = (uby8 *)calloc(hp->ns*hp->ns, sizeof(uby8));
-+
+        uby8    *vf;
-+
+        AMBSAMP *ap;
-+
+        int     i, j;
-+
-+
+        if (vflags == NULL)
-+
+                error(SYSTEM, "out of memory in vertex_flags()");
-+
+        vf = vflags;
-+
+        ap = hp->sa;            /* compute farthest along first row */
-+
+        for (j = 0; j < hp->ns-1; j++, vf++, ap++)
-+
+                if (ap[0].d <= ap[1].d)
-+
+                        vf[0] |= 1<<VDB_X;
-+
+                else
-+
+                        vf[1] |= 1<<VDB_x;
-+
+        ++vf; ++ap;
-+
+                                /* flag subsequent rows */
-+
+        for (i = 1; i < hp->ns; i++) {
-+
+            for (j = 0; j < hp->ns-1; j++, vf++, ap++) {
-+
+                if (ap[0].d <= ap[-hp->ns].d)   /* row before */
-+
+                        vf[0] |= 1<<VDB_y;
-+
+                else
-+
+                        vf[-hp->ns] |= 1<<VDB_Y;
-+
+                if (ap[0].d <= ap[1-hp->ns].d)  /* diagonal we care about */
-+
+                        vf[0] |= 1<<VDB_Xy;
-+
+                else
-+
+                        vf[1-hp->ns] |= 1<<VDB_xY;
-+
+                if (ap[0].d <= ap[1].d)         /* column after */
-+
+                        vf[0] |= 1<<VDB_X;
-+
+                else
-+
+                        vf[1] |= 1<<VDB_x;
-+
+            }
-+
+            if (ap[0].d <= ap[-hp->ns].d)       /* final column edge */
-+
+                vf[0] |= 1<<VDB_y;
-+
+            else
-+
+                vf[-hp->ns] |= 1<<VDB_Y;
-+
+            ++vf; ++ap;
-+
+        }
-+
+        return(vflags);
-+
+}
-+
-+
-+
+/* Return brightness of farthest ambient sample */
-+
+static double
-+
+back_ambval(AMBHEMI *hp, int i, int j, int dbit1, int dbit2, const uby8 *vflags)
-+
+{
-+
+        const int       v0 = ambndx(hp,i,j);
-+
+        const int       tflags = (1<<dbit1 | 1<<dbit2);
-+
+        int             v1, v2;
-+
-+
+        if ((vflags[v0] & tflags) == tflags)    /* is v0 the farthest? */
-+
+                return(colval(hp->sa[v0].v,CIEY));
-+
+        v1 = adjacent_verti(hp, i, j, dbit1);
-+
+        if (vflags[v0] & 1<<dbit2)              /* v1 farthest if v0>v2 */
-+
+                return(colval(hp->sa[v1].v,CIEY));
-+
+        v2 = adjacent_verti(hp, i, j, dbit2);
-+
+        if (vflags[v0] & 1<<dbit1)              /* v2 farthest if v0>v1 */
-+
+                return(colval(hp->sa[v2].v,CIEY));
-+
+                                                /* else check if v1>v2 */
-+
+        if (vflags[v1] & 1<<vdb_edge(dbit1,dbit2))
-+
+                return(colval(hp->sa[v1].v,CIEY));
-+
+        return(colval(hp->sa[v2].v,CIEY));
-+
+}
-+
-+
+/* Compute vectors and coefficients for Hessian/gradient calcs */
+static void
-<
+comp_fftri(FFTRI *ftp, float ap0[3], float ap1[3], FVECT rop)
->
+comp_fftri(FFTRI *ftp, AMBHEMI *hp, int i, int j, int dbit, const uby8 *vflags)
-<
+        FVECT   v1;
-<
+        double  dot_e, dot_er, dot_r, dot_r1;
->
+        const int       i0 = ambndx(hp,i,j);
->
+        double          rdot_cp, dot_e, dot_er, rdot_r, rdot_r1, J2;
->
+        int             i1, ii;
-<
+        VSUB(ftp->r_i, ap0, rop);
-<
+        VSUB(ftp->r_i1, ap1, rop);
-<
+        VSUB(ftp->e_i, ap1, ap0);
-<
+        VCROSS(v1, ftp->e_i, ftp->r_i);
-<
+        ftp->nf = 1.0/DOT(v1,v1);
-<
+        VCROSS(v1, ftp->r_i, ftp->r_i1);
-<
+        ftp->I1 = sqrt(DOT(v1,v1)*ftp->nf);
->
+        ftp->valid = 0;                 /* check if we can skip this edge */
->
+        ii = adjacent_trifl[dbit];
->
+        if ((vflags[i0] & ii) == ii)    /* cancels if vertex used as value */
->
+                return;
->
+        i1 = adjacent_verti(hp, i, j, dbit);
->
+        ii = adjacent_trifl[VDB_OPP(dbit)];
->
+        if ((vflags[i1] & ii) == ii)    /* on either end (for both triangles) */
->
+                return;
->
+                                        /* else go ahead with calculation */
->
+        VSUB(ftp->r_i, hp->sa[i0].p, hp->rp->rop);
->
+        VSUB(ftp->r_i1, hp->sa[i1].p, hp->rp->rop);
->
+        VSUB(ftp->e_i, hp->sa[i1].p, hp->sa[i0].p);
->
+        VCROSS(ftp->rcp, ftp->r_i, ftp->r_i1);
->
+        rdot_cp = 1.0/DOT(ftp->rcp,ftp->rcp);
+        dot_e = DOT(ftp->e_i,ftp->e_i);
+        dot_er = DOT(ftp->e_i, ftp->r_i);
-<
+        dot_r = DOT(ftp->r_i,ftp->r_i);
-<
+        dot_r1 = DOT(ftp->r_i1,ftp->r_i1);
-<
+        ftp->I2 = ( DOT(ftp->e_i, ftp->r_i1)/dot_r1 - dot_er/dot_r +
-<
+                        dot_e*ftp->I1 )*0.5*ftp->nf;
-<
+        ftp->J2 =  0.25*ftp->nf*( 1.0/dot_r - 1.0/dot_r1 ) -
-<
+                        dot_er/dot_e*ftp->I2;
->
+        rdot_r = 1.0/DOT(ftp->r_i,ftp->r_i);
->
+        rdot_r1 = 1.0/DOT(ftp->r_i1,ftp->r_i1);
->
+        ftp->I1 = acos( DOT(ftp->r_i, ftp->r_i1) * sqrt(rdot_r*rdot_r1) ) *
->
+                        sqrt( rdot_cp );
->
+        ftp->I2 = ( DOT(ftp->e_i, ftp->r_i1)*rdot_r1 - dot_er*rdot_r +
->
+                        dot_e*ftp->I1 )*0.5*rdot_cp;
->
+        J2 =  ( 0.5*(rdot_r - rdot_r1) - dot_er*ftp->I2 ) / dot_e;
->
+        for (ii = 3; ii--; )
->
+                ftp->rI2_eJ2[ii] = ftp->I2*ftp->r_i[ii] + J2*ftp->e_i[ii];
->
+        ftp->valid++;
+static void
+comp_hessian(FVECT hess[3], FFTRI *ftp, FVECT nrm)
-<
+        FVECT   v1, v2;
->
+        FVECT   ncp;
+        FVECT   m1[3], m2[3], m3[3], m4[3];
+        double  d1, d2, d3, d4;
+        double  I3, J3, K3;
+        int     i, j;
-+
-+
+        if (!ftp->valid) {              /* preemptive test */
-+
+                memset(hess, 0, sizeof(FVECT)*3);
-+
+                return;
-+
+        }
+                                        /* compute intermediate coefficients */
+        d1 = 1.0/DOT(ftp->r_i,ftp->r_i);
+        d2 = 1.0/DOT(ftp->r_i1,ftp->r_i1);
+        d3 = 1.0/DOT(ftp->e_i,ftp->e_i);
+        d4 = DOT(ftp->e_i, ftp->r_i);
-<
+        I3 = 0.25*ftp->nf*( DOT(ftp->e_i, ftp->r_i1)*d2*d2 - d4*d1*d1 +
-<
+.0*d3*ftp->I2 );
->
+        I3 = ( DOT(ftp->e_i, ftp->r_i1)*d2*d2 - d4*d1*d1 + 3.0/d3*ftp->I2 )
->
+                        / ( 4.0*DOT(ftp->rcp,ftp->rcp) );
+        J3 = 0.25*d3*(d1*d1 - d2*d2) - d4*d3*I3;
+        K3 = d3*(ftp->I2 - I3/d1 - 2.0*d4*J3);
+                                        /* intermediate matrices */
-<
+        VCROSS(v1, nrm, ftp->e_i);
-<
+        for (j = 3; j--; )
-<
+                v2[j] = ftp->I2*ftp->r_i[j] + ftp->J2*ftp->e_i[j];
-<
+        compose_matrix(m1, v1, v2);
->
+        VCROSS(ncp, nrm, ftp->e_i);
->
+        compose_matrix(m1, ncp, ftp->rI2_eJ2);
+        compose_matrix(m2, ftp->r_i, ftp->r_i);
+        compose_matrix(m3, ftp->e_i, ftp->e_i);
+        compose_matrix(m4, ftp->r_i, ftp->e_i);
-<
+        VCROSS(v1, ftp->r_i, ftp->e_i);
-<
+        d1 = DOT(nrm, v1);
->
+        d1 = DOT(nrm, ftp->rcp);
+        d2 = -d1*ftp->I2;
+        d1 *= 2.0;
+        for (i = 3; i--; )              /* final matrix sum */
+/* Add to radiometric Hessian from the given triangle */
+static void
+add2hessian(FVECT hess[3], FVECT ehess1[3],
-<
+                FVECT ehess2[3], FVECT ehess3[3], COLORV v)
->
+                FVECT ehess2[3], FVECT ehess3[3], double v)
+        int     i, j;
+static void
+comp_gradient(FVECT grad, FFTRI *ftp, FVECT nrm)
-<
+        FVECT   vcp;
->
+        FVECT   ncp;
+        double  f1;
+        int     i;
-<
+        VCROSS(vcp, ftp->r_i, ftp->r_i1);
-<
+        f1 = 2.0*DOT(nrm, vcp);
-<
+        VCROSS(vcp, nrm, ftp->e_i);
->
+        if (!ftp->valid) {              /* preemptive test */
->
+                memset(grad, 0, sizeof(FVECT));
->
+                return;
->
+        }
->
+        f1 = 2.0*DOT(nrm, ftp->rcp);
->
+        VCROSS(ncp, nrm, ftp->e_i);
+        for (i = 3; i--; )
-<
+                grad[i] = (0.5/PI)*( ftp->I1*vcp[i] +
-<
+                            f1*(ftp->I2*ftp->r_i[i] + ftp->J2*ftp->e_i[i]) );
->
+                grad[i] = (0.5/PI)*( ftp->I1*ncp[i] + f1*ftp->rI2_eJ2[i] );
+/* Add to displacement gradient from the given triangle */
+static void
-<
+add2gradient(FVECT grad, FVECT egrad1, FVECT egrad2, FVECT egrad3, COLORV v)
->
+add2gradient(FVECT grad, FVECT egrad1, FVECT egrad2, FVECT egrad3, double v)
+        int     i;
-–
+/* Return brightness of furthest ambient sample */
-–
+static COLORV
-–
+back_ambval(struct s_ambsamp *ap1, struct s_ambsamp *ap2,
-–
+                struct s_ambsamp *ap3, FVECT orig)
-–
+{
-–
+        COLORV  vback;
-–
+        FVECT   vec;
-–
+        double  d2, d2best;
-–
-–
+        VSUB(vec, ap1->p, orig);
-–
+        d2best = DOT(vec,vec);
-–
+        vback = ap1->v[CIEY];
-–
+        VSUB(vec, ap2->p, orig);
-–
+        d2 = DOT(vec,vec);
-–
+        if (d2 > d2best) {
-–
+                d2best = d2;
-–
+                vback = ap2->v[CIEY];
-–
+        }
-–
+        VSUB(vec, ap3->p, orig);
-–
+        d2 = DOT(vec,vec);
-–
+        if (d2 > d2best)
-–
+                return(ap3->v[CIEY]);
-–
+        return(vback);
-–
+}
-–
-–
+/* Compute anisotropic radii and eigenvector directions */
-<
+static int
->
+static void
+eigenvectors(FVECT uv[2], float ra[2], FVECT hessian[3])
+        double  hess2[2][2];
+        hess2[0][1] = DOT(uv[0], b);
+        hess2[1][0] = DOT(uv[1], a);
+        hess2[1][1] = DOT(uv[1], b);
-<
+                                        /* compute eigenvalues */
-<
+        if ( quadratic(evalue, 1.0, -hess2[0][0]-hess2[1][1],
-<
+                        hess2[0][0]*hess2[1][1]-hess2[0][1]*hess2[1][0]) != 2 ||
-<
+                        (evalue[0] = fabs(evalue[0])) <= FTINY*FTINY ||
-<
+                        (evalue[1] = fabs(evalue[1])) <= FTINY*FTINY )
-<
+                error(INTERNAL, "bad eigenvalue calculation");
-<
->
+                                        /* compute eigenvalue(s) */
->
+        i = quadratic(evalue, 1.0, -hess2[0][0]-hess2[1][1],
->
+                        hess2[0][0]*hess2[1][1]-hess2[0][1]*hess2[1][0]);
->
+        if (i == 1)                     /* double-root (circle) */
->
+                evalue[1] = evalue[0];
->
+        if (!i || ((evalue[0] = fabs(evalue[0])) <= FTINY*FTINY) |
->
+                        ((evalue[1] = fabs(evalue[1])) <= FTINY*FTINY) ) {
->
+                ra[0] = ra[1] = maxarad;
->
+                return;
->
+        }
+        if (evalue[0] > evalue[1]) {
-<
+                ra[0] = 1.0/sqrt(sqrt(evalue[0]));
-<
+                ra[1] = 1.0/sqrt(sqrt(evalue[1]));
->
+                ra[0] = sqrt(sqrt(4.0/evalue[0]));
->
+                ra[1] = sqrt(sqrt(4.0/evalue[1]));
+                slope1 = evalue[1];
+        } else {
-<
+                ra[0] = 1.0/sqrt(sqrt(evalue[1]));
-<
+                ra[1] = 1.0/sqrt(sqrt(evalue[0]));
->
+                ra[0] = sqrt(sqrt(4.0/evalue[1]));
->
+                ra[1] = sqrt(sqrt(4.0/evalue[0]));
+                slope1 = evalue[0];
+                                        /* compute unit eigenvectors */
+        static char     memerrmsg[] = "out of memory in ambHessian()";
+        FVECT           (*hessrow)[3] = NULL;
+        FVECT           *gradrow = NULL;
-+
+        uby8            *vflags;
+        FVECT           hessian[3];
+        FVECT           gradient;
+        FFTRI           fftr;
+                        error(SYSTEM, memerrmsg);
+                memset(gradient, 0, sizeof(gradient));
-+
+                                        /* get vertex position flags */
-+
+        vflags = vertex_flags(hp);
+                                        /* compute first row of edges */
+        for (j = 0; j < hp->ns-1; j++) {
-<
+                comp_fftri(&fftr, ambsamp(hp,0,j).p,
-<
+                                ambsamp(hp,0,j+1).p, hp->rp->rop);
->
+                comp_fftri(&fftr, hp, 0, j, VDB_X, vflags);
+                if (hessrow != NULL)
+                        comp_hessian(hessrow[j], &fftr, hp->rp->ron);
+                if (gradrow != NULL)
+        for (i = 0; i < hp->ns-1; i++) {
+            FVECT       hesscol[3];     /* compute first vertical edge */
+            FVECT       gradcol;
-<
+            comp_fftri(&fftr, ambsamp(hp,i,0).p,
-<
+                        ambsamp(hp,i+1,0).p, hp->rp->rop);
->
+            comp_fftri(&fftr, hp, i, 0, VDB_Y, vflags);
+            if (hessrow != NULL)
+                comp_hessian(hesscol, &fftr, hp->rp->ron);
+            if (gradrow != NULL)
+            for (j = 0; j < hp->ns-1; j++) {
+                FVECT   hessdia[3];     /* compute triangle contributions */
+                FVECT   graddia;
-<
+                COLORV  backg;
-<
+                backg = back_ambval(&ambsamp(hp,i,j), &ambsamp(hp,i,j+1),
-<
+                                        &ambsamp(hp,i+1,j), hp->rp->rop);
->
+                double  backg;
->
+                backg = back_ambval(hp, i, j, VDB_X, VDB_Y, vflags);
+                                        /* diagonal (inner) edge */
-<
+                comp_fftri(&fftr, ambsamp(hp,i,j+1).p,
-<
+                                ambsamp(hp,i+1,j).p, hp->rp->rop);
->
+                comp_fftri(&fftr, hp, i, j+1, VDB_xY, vflags);
+                if (hessrow != NULL) {
+                    comp_hessian(hessdia, &fftr, hp->rp->ron);
+                    rev_hessian(hesscol);
+                    add2hessian(hessian, hessrow[j], hessdia, hesscol, backg);
-<
+                if (gradient != NULL) {
->
+                if (gradrow != NULL) {
+                    comp_gradient(graddia, &fftr, hp->rp->ron);
+                    rev_gradient(gradcol);
+                    add2gradient(gradient, gradrow[j], graddia, gradcol, backg);
+                                        /* initialize edge in next row */
-<
+                comp_fftri(&fftr, ambsamp(hp,i+1,j+1).p,
-<
+                                ambsamp(hp,i+1,j).p, hp->rp->rop);
->
+                comp_fftri(&fftr, hp, i+1, j+1, VDB_x, vflags);
+                if (hessrow != NULL)
+                    comp_hessian(hessrow[j], &fftr, hp->rp->ron);
+                if (gradrow != NULL)
+                    comp_gradient(gradrow[j], &fftr, hp->rp->ron);
+                                        /* new column edge & paired triangle */
-<
+                backg = back_ambval(&ambsamp(hp,i,j+1), &ambsamp(hp,i+1,j+1),
-<
+                                        &ambsamp(hp,i+1,j), hp->rp->rop);
-<
+                comp_fftri(&fftr, ambsamp(hp,i,j+1).p, ambsamp(hp,i+1,j+1).p,
-<
+                                hp->rp->rop);
->
+                backg = back_ambval(hp, i+1, j+1, VDB_x, VDB_y, vflags);
->
+                comp_fftri(&fftr, hp, i, j+1, VDB_Y, vflags);
+                if (hessrow != NULL) {
+                    comp_hessian(hesscol, &fftr, hp->rp->ron);
+                    rev_hessian(hessdia);
+                                        /* release row buffers */
+        if (hessrow != NULL) free(hessrow);
+        if (gradrow != NULL) free(gradrow);
-+
+        free(vflags);
+        if (ra != NULL)                 /* extract eigenvectors & radii */
+                eigenvectors(uv, ra, hessian);
-<
+        if (pg != NULL) {               /* project position gradient */
->
+        if (pg != NULL) {               /* tangential position gradient */
+                pg[0] = DOT(gradient, uv[0]);
+                pg[1] = DOT(gradient, uv[1]);
+static void
+ambdirgrad(AMBHEMI *hp, FVECT uv[2], float dg[2])
-<
+        struct s_ambsamp        *ap;
-<
+        int                     n;
-<
+        FVECT                   vd;
-<
+        double                  gfact;
->
+        AMBSAMP *ap;
->
+        double  dgsum[2];
->
+        int     n;
->
+        FVECT   vd;
->
+        double  gfact;
-<
+        dg[0] = dg[1] = 0;
->
+        dgsum[0] = dgsum[1] = 0.0;      /* sum values times -tan(theta) */
+        for (ap = hp->sa, n = hp->ns*hp->ns; n--; ap++) {
+                                        /* use vector for azimuth + 90deg */
+                VSUB(vd, ap->p, hp->rp->rop);
-<
+                                        /* brightness with tangent factor */
-<
+                gfact = ap->v[CIEY] / DOT(hp->rp->ron, vd);
->
+                                        /* brightness over cosine factor */
->
+                gfact = colval(ap->v,CIEY) / DOT(hp->rp->ron, vd);
+                                        /* sine = proj_radius/vd_length */
-<
+                dg[0] -= DOT(uv[1], vd) * gfact;
-<
+                dg[1] += DOT(uv[0], vd) * gfact;
->
+                dgsum[0] -= DOT(uv[1], vd) * gfact;
->
+                dgsum[1] += DOT(uv[0], vd) * gfact;
-+
+        dg[0] = dgsum[0] / (hp->ns*hp->ns);
-+
+        dg[1] = dgsum[1] / (hp->ns*hp->ns);
-+
+/* Compute potential light leak direction flags for cache value */
-+
+static uint32
-+
+ambcorral(AMBHEMI *hp, FVECT uv[2], const double r0, const double r1)
-+
+{
-+
+        const double    max_d = 1.0/(minarad*ambacc + 0.001);
-+
+        const double    ang_res = 0.5*PI/(hp->ns-1);
-+
+        const double    ang_step = ang_res/((int)(16/PI*ang_res) + (1+FTINY));
-+
+        double          avg_d = 0;
-+
+        uint32          flgs = 0;
-+
+        int             i, j;
-+
+                                        /* don't bother for a few samples */
-+
+        if (hp->ns < 12)
-+
+                return(0);
-+
+                                        /* check distances overhead */
-+
+        for (i = hp->ns*3/4; i-- > hp->ns>>2; )
-+
+            for (j = hp->ns*3/4; j-- > hp->ns>>2; )
-+
+                avg_d += ambsam(hp,i,j).d;
-+
+        avg_d *= 4.0/(hp->ns*hp->ns);
-+
+        if (avg_d*r0 >= 1.0)            /* ceiling too low for corral? */
-+
+                return(0);
-+
+        if (avg_d >= max_d)             /* insurance */
-+
+                return(0);
-+
+                                        /* else circle around perimeter */
-+
+        for (i = 0; i < hp->ns; i++)
-+
+            for (j = 0; j < hp->ns; j += !i|(i==hp->ns-1) ? 1 : hp->ns-1) {
-+
+                AMBSAMP *ap = &ambsam(hp,i,j);
-+
+                FVECT   vec;
-+
+                double  u, v;
-+
+                double  ang, a1;
-+
+                int     abp;
-+
+                if ((ap->d <= FTINY) | (ap->d >= max_d))
-+
+                        continue;       /* too far or too near */
-+
+                VSUB(vec, ap->p, hp->rp->rop);
-+
+                u = DOT(vec, uv[0]) * ap->d;
-+
+                v = DOT(vec, uv[1]) * ap->d;
-+
+                if ((r0*r0*u*u + r1*r1*v*v) * ap->d*ap->d <= 1.0)
-+
+                        continue;       /* occluder outside ellipse */
-+
+                ang = atan2a(v, u);     /* else set direction flags */
-+
+                for (a1 = ang-.5*ang_res; a1 <= ang+.5*ang_res; a1 += ang_step)
-+
+                        flgs |= 1L<<(int)(16/PI*(a1 + 2.*PI*(a1 < 0)));
-+
+            }
-+
+        return(flgs);
-+
+}
-+
-+
+int
+doambient(                              /* compute ambient component */
+        COLOR   rcol,                   /* input/output color */
+        FVECT   uv[2],                  /* returned (optional) */
+        float   ra[2],                  /* returned (optional) */
+        float   pg[2],                  /* returned (optional) */
-<
+        float   dg[2]                   /* returned (optional) */
->
+        float   dg[2],                  /* returned (optional) */
->
+        uint32  *crlp                   /* returned (optional) */
-<
+        AMBHEMI                 *hp = inithemi(rcol, r, wt);
-<
+        int                     cnt = 0;
-<
+        FVECT                   my_uv[2];
-<
+        double                  d, acol[3];
-<
+        struct s_ambsamp        *ap;
-<
+        int                     i, j;
->
+        AMBHEMI *hp = inithemi(rcol, r, wt);
->
+        int     cnt;
->
+        FVECT   my_uv[2];
->
+        double  d, K, acol[3];
->
+        AMBSAMP *ap;
->
+        int     i, j;
+                                        /* check/initialize */
+        if (hp == NULL)
+                return(0);
+                pg[0] = pg[1] = 0.0;
+        if (dg != NULL)
+                dg[0] = dg[1] = 0.0;
-+
+        if (crlp != NULL)
-+
+                *crlp = 0;
+                                        /* sample the hemisphere */
+        acol[0] = acol[1] = acol[2] = 0.0;
-+
+        cnt = 0;
+        for (i = hp->ns; i--; )
+                for (j = hp->ns; j--; )
+                        if ((ap = ambsample(hp, i, j)) != NULL) {
+                free(hp);
+                return(0);              /* no valid samples */
-<
+        d = 1.0 / cnt;                  /* final indirect irradiance/PI */
-<
+        acol[0] *= d; acol[1] *= d; acol[2] *= d;
-<
+        copycolor(rcol, acol);
-<
+        if (cnt < hp->ns*hp->ns ||      /* incomplete sampling? */
-<
+                        (ra == NULL) & (pg == NULL) & (dg == NULL)) {
->
+        if (cnt < hp->ns*hp->ns) {      /* incomplete sampling? */
->
+                copycolor(rcol, acol);
+                free(hp);
-+
+                return(-1);             /* return value w/o Hessian */
-+
+        }
-+
+        cnt = ambssamp*wt + 0.5;        /* perform super-sampling? */
-+
+        if (cnt > 8)
-+
+                ambsupersamp(acol, hp, cnt);
-+
+        copycolor(rcol, acol);          /* final indirect irradiance/PI */
-+
+        if ((ra == NULL) & (pg == NULL) & (dg == NULL)) {
-+
+                free(hp);
+                return(-1);             /* no radius or gradient calc. */
-<
+        d = 0.01 * bright(rcol);        /* add in 1% before Hessian comp. */
-<
+        if (d < FTINY) d = FTINY;
-<
+        ap = hp->sa;                    /* using Y channel from here on... */
->
+        if ((d = bright(acol)) > FTINY) {       /* normalize Y values */
->
+                d = 0.99*(hp->ns*hp->ns)/d;
->
+                K = 0.01;
->
+        } else {                        /* or fall back on geometric Hessian */
->
+                K = 1.0;
->
+                pg = NULL;
->
+                dg = NULL;
->
+                crlp = NULL;
->
+        }
->
+        ap = hp->sa;                    /* relative Y channel from here on... */
+        for (i = hp->ns*hp->ns; i--; ap++)
-<
+                colval(ap->v,CIEY) = bright(ap->v) + d;
->
+                colval(ap->v,CIEY) = bright(ap->v)*d + K;
+        if (uv == NULL)                 /* make sure we have axis pointers */
+                uv = my_uv;
+                                        /* compute radii & pos. gradient */
+        ambHessian(hp, uv, ra, pg);
-+
+        if (dg != NULL)                 /* compute direction gradient */
+                ambdirgrad(hp, uv, dg);
-+
+        if (ra != NULL) {               /* scale/clamp radii */
-<
+                d = sqrt(sqrt((4.0/PI)*bright(rcol)/wt));
-<
+                ra[0] *= d;
->
+                if (pg != NULL) {
->
+                        if (ra[0]*(d = fabs(pg[0])) > 1.0)
->
+                                ra[0] = 1.0/d;
->
+                        if (ra[1]*(d = fabs(pg[1])) > 1.0)
->
+                                ra[1] = 1.0/d;
->
+                        if (ra[0] > ra[1])
->
+                                ra[0] = ra[1];
->
+                }
->
+                if (ra[0] < minarad) {
->
+                        ra[0] = minarad;
->
+                        if (ra[1] < minarad)
->
+                                ra[1] = minarad;
->
+                }
->
+                ra[0] *= d = 1.0/sqrt(sqrt(wt));
+                if ((ra[1] *= d) > 2.0*ra[0])
+                        ra[1] = 2.0*ra[0];
+                if (ra[1] > maxarad) {
+                        ra[1] = maxarad;
+                        if (ra[0] > maxarad)
+                                ra[0] = maxarad;
-+
+                }
-+
+                                        /* flag encroached directions */
-+
+                if ((wt >= 0.5-FTINY) & (crlp != NULL))
-+
+                        *crlp = ambcorral(hp, uv, ra[0]*ambacc, ra[1]*ambacc);
-+
+                if (pg != NULL) {       /* cap gradient if necessary */
-+
+                        d = pg[0]*pg[0]*ra[0]*ra[0] + pg[1]*pg[1]*ra[1]*ra[1];
-+
+                        if (d > 1.0) {
-+
+                                d = 1.0/sqrt(d);
-+
+                                pg[0] *= d;
-+
+                                pg[1] *= d;
-+
+                        }
+        free(hp);                       /* clean up and return */

Diff Legend

-–
+Removed lines
-+
+Added lines
-<
+Changed lines (old)
->
+Changed lines (new)

Comparing ray/src/rt/ambcomp.c (file contents): Revision 2.28 by greg, Sat Apr 19 19:20:47 2014 UTC vs. Revision 2.54 by greg, Fri May 9 04:55:19 2014 UTC

Diff Legend

Comparing ray/src/rt/ambcomp.c (file contents):
Revision 2.28 by greg, Sat Apr 19 19:20:47 2014 UTC vs.
Revision 2.54 by greg, Fri May 9 04:55:19 2014 UTC