m/fast: add some fast maths approximations

2015-07-29 16:11:48 +10:00 · 2015-07-29 16:11:48 +10:00 · eb155d5bb0
commit eb155d5bb0
parent 48d6a007a2
4 changed files with 193 additions and 0 deletions
--- a/Makefile.am
+++ b/Makefile.am
@ -127,6 +127,8 @@ UTIL_FILES   =			\
    maths.cpp			\
    maths.hpp			\
    maths.ipp			\
    maths/fast.hpp		\
    maths/fast.ipp		\
    matrix.cpp			\
    matrix.hpp			\
    matrix.ipp			\
@ -335,6 +337,7 @@ TEST_BIN = 			\
    test/json_types		\
    test/ray 			\
    test/maths			\
    test/maths_fast		\
    test/matrix			\
    test/md2			\
    test/md4			\
--- a/maths/fast.hpp
+++ b/maths/fast.hpp
@ -0,0 +1,44 @@
 /*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * Copyright 2015 Danny Robson <danny@nerdcruft.net>
 */
 #ifndef __UTIL_MATHS_FAST_HPP
 #define __UTIL_MATHS_FAST_HPP
 namespace util { namespace maths { namespace fast {
    ///////////////////////////////////////////////////////////////////////////
    constexpr float pow (float, float);
    constexpr float pow2 (float);
    ///////////////////////////////////////////////////////////////////////////
    constexpr float exp (float);
    ///////////////////////////////////////////////////////////////////////////
    constexpr float log (float);
    constexpr float log2 (float);
    ///////////////////////////////////////////////////////////////////////////
    constexpr float sqrt (float);
    constexpr float invsqrt (float);
 } } }
 #include "fast.ipp"
 #endif
--- a/maths/fast.ipp
+++ b/maths/fast.ipp
@ -0,0 +1,107 @@
 /*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 *
 * Copyright 2015 Danny Robson <danny@nerdcruft.net>
 */
 #ifdef __UTIL_MATHS_FAST_IPP
 #error
 #endif
 #define __UTIL_MATHS_FAST_IPP
 namespace util { namespace maths { namespace fast {
    ///////////////////////////////////////////////////////////////////////////
    constexpr float
    pow2 (float p)
    {
        float offset = (p < 0) ? 1.0f : 0.0f;
        float clipp = (p < -126) ? -126.0f : p;
        int32_t w = static_cast<int32_t> (clipp);
        float z = clipp - w + offset;
        union { uint32_t i; float f; } v = { static_cast<uint32_t> ( (1 << 23) * (clipp + 121.2740575f + 27.7280233f / (4.84252568f - z) - 1.49012907f * z) ) };
        return v.f;
        //float clipp = (p < -126) ? -126.0f : p;
        //union { uint32_t i; float f; } v = { static_cast<uint32_t> ( (1 << 23) * (clipp + 126.94269504f) ) };
        //return v.f;
    }
    constexpr float
    log2 (float x)
    {
        union { float f; uint32_t i; } vx = { x };
        union { uint32_t i; float f; } mx = { (vx.i & 0x007FFFFF) | 0x3f000000 };
        float y = vx.i;
        y *= 1.1920928955078125e-7f;
        return y - 124.22551499f
            - 1.498030302f * mx.f 
            - 1.72587999f / (0.3520887068f + mx.f);
        //union { float f; uint32_t i; } vx = { x };
        //float y = vx.i;
        //y *= 1.1920928955078125e-7f;
        //return y - 126.94269504f;
    }
    constexpr float
    log (float x)
    {
        return 0.69314718f * log2 (x);
    }
    constexpr float
    pow (float a, float b)
    {
        return pow2 (b * log2 (a));
    }
    constexpr float
    sqrt (float x)
    {
        //return pow (x, 0.5f);
        union { float f; int32_t i; } u  = { x };
        int32_t v = u.i;
        v  -= 1 << 23;
        v >>= 1;
        v  += 1 << 29;
        u.i = v;
        return u.f;
    }
    constexpr float
    invsqrt (float x)
    {
        union
        {
            float x;
            int32_t i;
        } u = { x };
        u.i = 0x5f3759df - (u.i >> 1);
        // refine estimate. repeat as necessary.
        u.x = u.x * (1.5f - x * 0.5f * u.x * u.x);
        return u.x;
    }
 } } }
--- a/test/maths_fast.cpp
+++ b/test/maths_fast.cpp
@ -0,0 +1,39 @@
 #include "tap.hpp"
 #include "maths/fast.hpp"
 constexpr float
 threshold (float a, float b)
 {
    constexpr float PARTS = 100;
    return std::abs (a + b) / 2 / PARTS;
 }
 int
 main (void)
 {
    util::TAP::logger tap;
    {
        auto a = util::maths::fast::log2 (3.456f);
        auto b = std::log2 (3.456f);
        tap.expect_lt (std::abs (a - b), threshold (a, b), "fast log2");
    }
    {
        auto a = util::maths::fast::pow2 (-100.f);
        auto b = std::pow (2.f, -100.f);
        tap.expect_lt (std::abs (a - b), threshold (a, b), "fast pow2");
    }
    {
        auto a = util::maths::fast::pow (0.8f, 100.f);
        auto b = std::pow (0.8f, 100.f);
        tap.expect_lt (std::abs (a - b), threshold (a, b), "fast pow");
    }
    return tap.status ();
 }