diff --git a/glm/gtx/fast_trigonometry.inl b/glm/gtx/fast_trigonometry.inl index 16a821ad..b8c65810 100644 --- a/glm/gtx/fast_trigonometry.inl +++ b/glm/gtx/fast_trigonometry.inl @@ -33,6 +33,16 @@ namespace glm{ namespace detail { + template class vecType> + GLM_FUNC_QUALIFIER vecType taylorCos(vecType const & x) + { + return static_cast(1) + - (x * x) / 2.f + + (x * x * x * x) / 24.f + - (x * x * x * x * x * x) / 720.f + + (x * x * x * x * x * x * x * x) / 40320.f; + } + template GLM_FUNC_QUALIFIER T cos_52s(T x) { @@ -66,11 +76,11 @@ namespace detail { T const angle(wrapAngle(x)); - if(angle()) + if(angle < half_pi()) return detail::cos_52s(angle); - if(angle()) + if(angle < pi()) return -detail::cos_52s(pi() - angle); - if(angle<(T(3) * half_pi())) + if(angle < (T(3) * half_pi())) return -detail::cos_52s(angle - pi()); return detail::cos_52s(two_pi() - angle); diff --git a/test/core/core_func_common.cpp b/test/core/core_func_common.cpp index 9a7c5d94..7911a72f 100644 --- a/test/core/core_func_common.cpp +++ b/test/core/core_func_common.cpp @@ -168,6 +168,22 @@ namespace mod_ { int Error(0); + { + float A(1.5f); + float B(1.0f); + float C = glm::mod(A, B); + + Error += glm::abs(C - 0.5f) < 0.00001f ? 0 : 1; + } + + { + float A(-0.2f); + float B(1.0f); + float C = glm::mod(A, B); + + Error += glm::abs(C - 0.8f) < 0.00001f ? 0 : 1; + } + { float A(3.0); float B(2.0f); diff --git a/test/core/core_func_trigonometric.cpp b/test/core/core_func_trigonometric.cpp index fa391151..abadc6f5 100644 --- a/test/core/core_func_trigonometric.cpp +++ b/test/core/core_func_trigonometric.cpp @@ -30,17 +30,12 @@ /////////////////////////////////////////////////////////////////////////////////// #include -/* -float sin(float x) { - float temp; - temp = (x + M_PI) / ((2 * M_PI) - M_PI); - return limited_sin((x + M_PI) - ((2 * M_PI) - M_PI) * temp)); -} -*/ + int main() { - int Failed = 0; + int Error = 0; - return Failed; + + return Error; } diff --git a/test/gtc/gtc_color.cpp b/test/gtc/gtc_color.cpp index 77759dac..03bd0261 100644 --- a/test/gtc/gtc_color.cpp +++ b/test/gtc/gtc_color.cpp @@ -39,20 +39,34 @@ namespace srgb { int Error(0); - glm::vec4 const ColorSourceRGB(1.0, 0.5, 0.0, 1.0); + glm::vec3 const ColorSourceRGB(1.0, 0.5, 0.0); { - glm::vec4 const ColorSRGB = glm::convertRgbToSrgb(ColorSourceRGB); - glm::vec4 const ColorRGB = glm::convertSrgbToRgb(ColorSRGB); + glm::vec3 const ColorSRGB = glm::convertRgbToSrgb(ColorSourceRGB); + glm::vec3 const ColorRGB = glm::convertSrgbToRgb(ColorSRGB); Error += glm::all(glm::epsilonEqual(ColorSourceRGB, ColorRGB, 0.00001f)) ? 0 : 1; } { - glm::vec4 const ColorSRGB = glm::convertRgbToSrgb(ColorSourceRGB, 2.8f); - glm::vec4 const ColorRGB = glm::convertSrgbToRgb(ColorSRGB, 2.8f); + glm::vec3 const ColorSRGB = glm::convertRgbToSrgb(ColorSourceRGB, 2.8f); + glm::vec3 const ColorRGB = glm::convertSrgbToRgb(ColorSRGB, 2.8f); Error += glm::all(glm::epsilonEqual(ColorSourceRGB, ColorRGB, 0.00001f)) ? 0 : 1; } + glm::vec4 const ColorSourceRGBA(1.0, 0.5, 0.0, 1.0); + + { + glm::vec4 const ColorSRGB = glm::convertRgbToSrgb(ColorSourceRGBA); + glm::vec4 const ColorRGB = glm::convertSrgbToRgb(ColorSRGB); + Error += glm::all(glm::epsilonEqual(ColorSourceRGBA, ColorRGB, 0.00001f)) ? 0 : 1; + } + + { + glm::vec4 const ColorSRGB = glm::convertRgbToSrgb(ColorSourceRGBA, 2.8f); + glm::vec4 const ColorRGB = glm::convertSrgbToRgb(ColorSRGB, 2.8f); + Error += glm::all(glm::epsilonEqual(ColorSourceRGBA, ColorRGB, 0.00001f)) ? 0 : 1; + } + return Error; } }//namespace srgb diff --git a/test/gtx/gtx_fast_trigonometry.cpp b/test/gtx/gtx_fast_trigonometry.cpp index eb73157b..46faffd5 100644 --- a/test/gtx/gtx_fast_trigonometry.cpp +++ b/test/gtx/gtx_fast_trigonometry.cpp @@ -31,10 +31,16 @@ #include #include +#include +#include #include #include +#include +#include +#include #include #include +#include namespace fastCos { @@ -43,12 +49,15 @@ namespace fastCos const float begin = -glm::pi(); const float end = glm::pi(); float result = 0.f; + const std::clock_t timestamp1 = std::clock(); - for(float i=begin; i(); const float end = glm::pi(); float result = 0.f; + const std::clock_t timestamp1 = std::clock(); - for (float i = begin; i(); const float end = glm::pi(); float result = 0.f; + const std::clock_t timestamp1 = std::clock(); - for (float i = begin; i(); const float end = glm::pi(); float result = 0.f; + const std::clock_t timestamp1 = std::clock(); - for (float i = begin; i(time_fast)); std::printf("acos Time %d clocks\n", static_cast(time_default)); @@ -144,10 +163,10 @@ namespace fastAsin const float end = glm::pi(); float result = 0.f; const std::clock_t timestamp1 = std::clock(); - for (float i = begin; i(); float result = 0.f; const std::clock_t timestamp1 = std::clock(); - for (float i = begin; i() * 0.5f, glm::pi() * 1.0f, glm::pi() * 1.5f); + + template class vecType> + GLM_FUNC_QUALIFIER vecType taylorSeriesNewCos(vecType const & x) + { + vecType const Powed2(x * x); + vecType const Powed4(Powed2 * Powed2); + vecType const Powed6(Powed4 * Powed2); + vecType const Powed8(Powed4 * Powed4); + + return static_cast(1) + - Powed2 * static_cast(0.5) + + Powed4 * static_cast(0.04166666666666666666666666666667) + - Powed6 * static_cast(0.00138888888888888888888888888889) + + Powed8 * static_cast(2.4801587301587301587301587301587e-5); + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType taylorSeriesNewCos6(vecType const & x) + { + vecType const Powed2(x * x); + vecType const Powed4(Powed2 * Powed2); + vecType const Powed6(Powed4 * Powed2); + + return static_cast(1) + - Powed2 * static_cast(0.5) + + Powed4 * static_cast(0.04166666666666666666666666666667) + - Powed6 * static_cast(0.00138888888888888888888888888889); + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType fastAbs(vecType x) + { + int* Pointer = reinterpret_cast(&x[0]); + *(((int *) &Pointer[0]) + 1) &= 0x7fffffff; + *(((int *) &Pointer[1]) + 1) &= 0x7fffffff; + *(((int *) &Pointer[2]) + 1) &= 0x7fffffff; + *(((int *) &Pointer[3]) + 1) &= 0x7fffffff; + return x; + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType fastCosNew(vecType const & x) + { + vecType const Angle0_PI(fastAbs(fmod(x + glm::pi(), glm::two_pi()) - glm::pi())); + return taylorSeriesNewCos6(x); +/* + vecType const FirstQuarterPi(lessThanEqual(Angle0_PI, vecType(glm::half_pi()))); + + vecType const RevertAngle(mix(vecType(glm::pi()), vecType(0), FirstQuarterPi)); + vecType const ReturnSign(mix(vecType(-1), vecType(1), FirstQuarterPi)); + vecType const SectionAngle(RevertAngle - Angle0_PI); + + return ReturnSign * taylorSeriesNewCos(SectionAngle); +*/ + } + + int perf_fastCosNew(float Begin, float End, std::size_t Samples) + { + std::vector Results; + Results.resize(Samples); + + float Steps = (End - Begin) / Samples; + + std::clock_t const TimeStampBegin = std::clock(); + + for(std::size_t i = 0; i < Samples; ++i) + Results[i] = taylorCos::fastCosNew(AngleShift + glm::vec4(Begin + Steps * i)); + + std::clock_t const TimeStampEnd = std::clock(); + + std::printf("fastCosNew %ld clocks\n", TimeStampEnd - TimeStampBegin); + + int Error = 0; + for(std::size_t i = 0; i < Samples; ++i) + Error += Results[i].x >= -1.0f && Results[i].x <= 1.0f ? 0 : 1; + return Error; + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType deterministic_fmod(vecType const & x, T y) + { + return x - y * trunc(x / y); + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType fastCosDeterminisctic(vecType const & x) + { + vecType const Angle0_PI(abs(deterministic_fmod(x + glm::pi(), glm::two_pi()) - glm::pi())); + vecType const FirstQuarterPi(lessThanEqual(Angle0_PI, vecType(glm::half_pi()))); + + vecType const RevertAngle(mix(vecType(glm::pi()), vecType(0), FirstQuarterPi)); + vecType const ReturnSign(mix(vecType(-1), vecType(1), FirstQuarterPi)); + vecType const SectionAngle(RevertAngle - Angle0_PI); + + return ReturnSign * taylorSeriesNewCos(SectionAngle); + } + + int perf_fastCosDeterminisctic(float Begin, float End, std::size_t Samples) + { + std::vector Results; + Results.resize(Samples); + + float Steps = (End - Begin) / Samples; + + std::clock_t const TimeStampBegin = std::clock(); + + for(std::size_t i = 0; i < Samples; ++i) + Results[i] = taylorCos::fastCosDeterminisctic(AngleShift + glm::vec4(Begin + Steps * i)); + + std::clock_t const TimeStampEnd = std::clock(); + + std::printf("fastCosDeterminisctic %ld clocks\n", TimeStampEnd - TimeStampBegin); + + int Error = 0; + for(std::size_t i = 0; i < Samples; ++i) + Error += Results[i].x >= -1.0f && Results[i].x <= 1.0f ? 0 : 1; + return Error; + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType taylorSeriesRefCos(vecType const & x) + { + return static_cast(1) + - (x * x) / glm::factorial(static_cast(2)) + + (x * x * x * x) / glm::factorial(static_cast(4)) + - (x * x * x * x * x * x) / glm::factorial(static_cast(6)) + + (x * x * x * x * x * x * x * x) / glm::factorial(static_cast(8)); + } + + template class vecType> + GLM_FUNC_QUALIFIER vecType fastRefCos(vecType const & x) + { + vecType const Angle0_PI(glm::abs(fmod(x + glm::pi(), glm::two_pi()) - glm::pi())); +// return taylorSeriesRefCos(Angle0_PI); + + vecType const FirstQuarterPi(lessThanEqual(Angle0_PI, vecType(glm::half_pi()))); + + vecType const RevertAngle(mix(vecType(glm::pi()), vecType(0), FirstQuarterPi)); + vecType const ReturnSign(mix(vecType(-1), vecType(1), FirstQuarterPi)); + vecType const SectionAngle(RevertAngle - Angle0_PI); + + return ReturnSign * taylorSeriesRefCos(SectionAngle); + } + + int perf_fastCosRef(float Begin, float End, std::size_t Samples) + { + std::vector Results; + Results.resize(Samples); + + float Steps = (End - Begin) / Samples; + + std::clock_t const TimeStampBegin = std::clock(); + + for(std::size_t i = 0; i < Samples; ++i) + Results[i] = taylorCos::fastRefCos(AngleShift + glm::vec4(Begin + Steps * i)); + + std::clock_t const TimeStampEnd = std::clock(); + + std::printf("fastCosRef %ld clocks\n", TimeStampEnd - TimeStampBegin); + + int Error = 0; + for(std::size_t i = 0; i < Samples; ++i) + Error += Results[i].x >= -1.0f && Results[i].x <= 1.0f ? 0 : 1; + return Error; + } + + int perf_fastCosOld(float Begin, float End, std::size_t Samples) + { + std::vector Results; + Results.resize(Samples); + + float Steps = (End - Begin) / Samples; + + std::clock_t const TimeStampBegin = std::clock(); + + for(std::size_t i = 0; i < Samples; ++i) + Results[i] = glm::fastCos(AngleShift + glm::vec4(Begin + Steps * i)); + + std::clock_t const TimeStampEnd = std::clock(); + + std::printf("fastCosOld %ld clocks\n", TimeStampEnd - TimeStampBegin); + + int Error = 0; + for(std::size_t i = 0; i < Samples; ++i) + Error += Results[i].x >= -1.0f && Results[i].x <= 1.0f ? 0 : 1; + return Error; + } + + int perf_cos(float Begin, float End, std::size_t Samples) + { + std::vector Results; + Results.resize(Samples); + + float Steps = (End - Begin) / Samples; + + std::clock_t const TimeStampBegin = std::clock(); + + for(std::size_t i = 0; i < Samples; ++i) + Results[i] = glm::cos(AngleShift + glm::vec4(Begin + Steps * i)); + + std::clock_t const TimeStampEnd = std::clock(); + + std::printf("cos %ld clocks\n", TimeStampEnd - TimeStampBegin); + + int Error = 0; + for(std::size_t i = 0; i < Samples; ++i) + Error += Results[i].x >= -1.0f && Results[i].x <= 1.0f ? 0 : 1; + return Error; + } + + int perf() + { + int Error = 0; + + float const Begin = -glm::pi(); + float const End = glm::pi(); + std::size_t const Samples = 10000000; + + Error += perf_cos(Begin, End, Samples); + Error += perf_fastCosOld(Begin, End, Samples); + Error += perf_fastCosRef(Begin, End, Samples); + //Error += perf_fastCosNew(Begin, End, Samples); + Error += perf_fastCosDeterminisctic(Begin, End, Samples); + + return Error; + } + + int test() + { + int Error = 0; + + //for(float Angle = -4.0f * glm::pi(); Angle < 4.0f * glm::pi(); Angle += 0.1f) + //for(float Angle = -720.0f; Angle < 720.0f; Angle += 0.1f) + for(float Angle = 0.0f; Angle < 180.0f; Angle += 0.1f) + { + float const modAngle = std::fmod(glm::abs(Angle), 360.f); + assert(modAngle >= 0.0f && modAngle <= 360.f); + float const radAngle = glm::radians(modAngle); + float const Cos0 = std::cos(radAngle); + + float const Cos1 = taylorCos::fastRefCos(glm::fvec1(radAngle)).x; + Error += glm::abs(Cos1 - Cos0) < 0.1f ? 0 : 1; + + float const Cos2 = taylorCos::fastCosNew(glm::fvec1(radAngle)).x; + //Error += glm::abs(Cos2 - Cos0) < 0.1f ? 0 : 1; + + assert(!Error); + } + + return Error; + } +}//namespace taylorCos + int main() { int Error(0); + Error += ::taylorCos::test(); + Error += ::taylorCos::perf(); + # ifdef NDEBUG Error += ::fastCos::perf(); Error += ::fastSin::perf();