PtexExtractor/ptex/PtexUtils.h

#ifndef PtexUtils_h
#define PtexUtils_h

/* 
PTEX SOFTWARE
Copyright 2009 Disney Enterprises, Inc.  All rights reserved

Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are
met:

  * Redistributions of source code must retain the above copyright
    notice, this list of conditions and the following disclaimer.

  * Redistributions in binary form must reproduce the above copyright
    notice, this list of conditions and the following disclaimer in
    the documentation and/or other materials provided with the
    distribution.

  * The names "Disney", "Walt Disney Pictures", "Walt Disney Animation
    Studios" or the names of its contributors may NOT be used to
    endorse or promote products derived from this software without
    specific prior written permission from Walt Disney Pictures.

Disclaimer: THIS SOFTWARE IS PROVIDED BY WALT DISNEY PICTURES AND
CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING,
BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY, FITNESS
FOR A PARTICULAR PURPOSE, NONINFRINGEMENT AND TITLE ARE DISCLAIMED.
IN NO EVENT SHALL WALT DISNEY PICTURES, THE COPYRIGHT HOLDER OR
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND BASED ON ANY
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.
*/

#include "Ptexture.h"

struct PtexUtils : public Ptex {

    static bool isPowerOfTwo(int x)
    {
    return !(x&(x-1));
    }

    static uint32_t ones(uint32_t x)
    {
    // count number of ones
    x = (x & 0x55555555) + ((x >> 1) & 0x55555555); // add pairs of bits
    x = (x & 0x33333333) + ((x >> 2) & 0x33333333); // add bit pairs
    x = (x & 0x0f0f0f0f) + ((x >> 4) & 0x0f0f0f0f); // add nybbles
    x += (x >> 8);                              // add bytes
    x += (x >> 16);                                 // add words
    return(x & 0xff);
    }

    static uint32_t floor_log2(uint32_t x)
    {
    // floor(log2(n))
    x |= (x >> 1);
    x |= (x >> 2);
    x |= (x >> 4);
    x |= (x >> 8);
    x |= (x >> 16);
    return ones(x>>1);
    }

    static uint32_t ceil_log2(uint32_t x)
    {
    // ceil(log2(n))
    bool isPow2 = isPowerOfTwo(x);
    x |= (x >> 1);
    x |= (x >> 2);
    x |= (x >> 4);
    x |= (x >> 8);
    x |= (x >> 16);
    return ones(x>>1) + !isPow2;
    }

    static double smoothstep(double x, double a, double b)
    {
    if ( x < a ) return 0;
    if ( x >= b ) return 1;
    x = (x - a)/(b - a);
    return x*x * (3 - 2*x);
    }

    static double qsmoothstep(double x, double a, double b)
    {
    // quintic smoothstep (cubic is only C1)
    if ( x < a ) return 0;
    if ( x >= b ) return 1;
    x = (x - a)/(b - a);
    return x*x*x * (10 + x * (-15 + x*6));
    }

    template<typename T>
    static T cond(bool c, T a, T b) { return c * a + (!c)*b; }

    template<typename T>
    static T min(T a, T b) { return cond(a < b, a, b); }

    template<typename T>
    static T max(T a, T b) { return cond(a >= b, a, b); }

    template<typename T>
    static T clamp(T x, T lo, T hi) { return cond(x < lo, lo, cond(x > hi, hi, x)); }

    static bool isConstant(const void* data, int stride, int ures, int vres, 
               int pixelSize);
    static void interleave(const void* src, int sstride, int ures, int vres, 
               void* dst, int dstride, DataType dt, int nchannels);
    static void deinterleave(const void* src, int sstride, int ures, int vres, 
                 void* dst, int dstride, DataType dt, int nchannels);
    static void encodeDifference(void* data, int size, DataType dt);
    static void decodeDifference(void* data, int size, DataType dt);
    typedef void ReduceFn(const void* src, int sstride, int ures, int vres,
              void* dst, int dstride, DataType dt, int nchannels);
    static void reduce(const void* src, int sstride, int ures, int vres,
               void* dst, int dstride, DataType dt, int nchannels);
    static void reduceu(const void* src, int sstride, int ures, int vres,
            void* dst, int dstride, DataType dt, int nchannels);
    static void reducev(const void* src, int sstride, int ures, int vres,
            void* dst, int dstride, DataType dt, int nchannels);
    static void reduceTri(const void* src, int sstride, int ures, int vres,
              void* dst, int dstride, DataType dt, int nchannels);
    static void average(const void* src, int sstride, int ures, int vres,
            void* dst, DataType dt, int nchannels);
    static void fill(const void* src, void* dst, int dstride,
             int ures, int vres, int pixelsize);
    static void copy(const void* src, int sstride, void* dst, int dstride,
             int nrows, int rowlen);
    static void blend(const void* src, float weight, void* dst, bool flip,
              int rowlen, DataType dt, int nchannels);
    static void multalpha(void* data, int npixels, DataType dt, int nchannels, int alphachan);
    static void divalpha(void* data, int npixels, DataType dt, int nchannels, int alphachan);

    static void genRfaceids(const FaceInfo* faces, int nfaces, 
                uint32_t* rfaceids, uint32_t* faceids);

    // fixed length vector accumulator: dst[i] += val[i] * weight
    template<typename T, int n>
    struct VecAccum {
    VecAccum() {}
    void operator()(double* dst, const T* val, double weight) 
    {
        *dst += *val * weight;
        // use template to unroll loop
        VecAccum<T,n-1>()(dst+1, val+1, weight);
    }
    };
    template<typename T>
    struct VecAccum<T,0> { void operator()(double*, const T*, double) {} };

    // variable length vector accumulator: dst[i] += val[i] * weight
    template<typename T>
    struct VecAccumN {
    void operator()(double* dst, const T* val, int nchan, double weight) 
    {
        for (int i = 0; i < nchan; i++) dst[i] += val[i] * weight;
    }
    };

    // fixed length vector multiplier: dst[i] += val[i] * weight
    template<typename T, int n>
    struct VecMult {
    VecMult() {}
    void operator()(double* dst, const T* val, double weight) 
    {
        *dst = *val * weight;
        // use template to unroll loop
        VecMult<T,n-1>()(dst+1, val+1, weight);
    }
    };
    template<typename T>
    struct VecMult<T,0> { void operator()(double*, const T*, double) {} };

    // variable length vector multiplier: dst[i] = val[i] * weight
    template<typename T>
    struct VecMultN {
    void operator()(double* dst, const T* val, int nchan, double weight) 
    {
        for (int i = 0; i < nchan; i++) dst[i] = val[i] * weight;
    }
    };

    typedef void (*ApplyConstFn)(double weight, double* dst, void* data, int nChan);
    static ApplyConstFn applyConstFunctions[20];
    static void applyConst(double weight, double* dst, void* data, Ptex::DataType dt, int nChan)
    {
    // dispatch specialized apply function
    ApplyConstFn fn = applyConstFunctions[((unsigned)nChan<=4)*nChan*4 + dt];
    fn(weight, dst, data, nChan);
    }
};

#endif