From 29a42f48fcddf51bdf0ae640aa2513f1091e10d3 Mon Sep 17 00:00:00 2001 From: Vito Caputo Date: Fri, 21 Jul 2023 15:39:46 -0700 Subject: modules/shapes: drop atan2_approx() With the addition of the "radcache" in b6362c, the need for a faster approximate atan2f() is largely eliminated. And there seems to be a bug in the implementation as-is taken from https://mazzo.li/posts/vectorized-atan2.html You can see the bug as vertical line artifact around the center where the X coordinate would be 0. Rather than debug what's wrong with this approximation's implementation surrounding its quadrant adjustments, let's just resume using atan2f() and let the cache keep things quick. --- src/modules/shapes/shapes.c | 47 ++++----------------------------------------- 1 file changed, 4 insertions(+), 43 deletions(-) (limited to 'src') diff --git a/src/modules/shapes/shapes.c b/src/modules/shapes/shapes.c index 3943652..b32d7ce 100644 --- a/src/modules/shapes/shapes.c +++ b/src/modules/shapes/shapes.c @@ -238,45 +238,6 @@ static void shapes_prepare_frame(til_module_context_t *context, til_stream_t *st } -/* simple approximation taken from https://mazzo.li/posts/vectorized-atan2.html */ -static inline float atan_scalar_approximation(float x) { - /* TODO: this is probably more terms/precision than needed, but when I try just dropping some, - * the circle+slight pinches gets artifacts. So leaving for now, probably needs slightly different - * values for fewer terms. - */ - float a1 = 0.99997726f; - float a3 = -0.33262347f; - float a5 = 0.19354346f; - float a7 = -0.11643287f; - float a9 = 0.05265332f; - float a11 = -0.01172120f; - float x_sq = x*x; - - return x * (a1 + x_sq * (a3 + x_sq * (a5 + x_sq * (a7 + x_sq * (a9 + x_sq * a11))))); -} - - -static float atan2_approx(float y, float x) { - // Ensure input is in [-1, +1] - int swap = fabs(x) < fabs(y); - float atan_input = (swap ? x : y) / (swap ? y : x); - - // Approximate atan - float res = atan_scalar_approximation(atan_input); - - // If swapped, adjust atan output - res = swap ? (atan_input >= 0.0f ? M_PI_2 : -M_PI_2) - res : res; - - // Adjust quadrants - if (x < 0.0f && y >= 0.0f) - res = M_PI + res; // 2nd quadrant - else if (x < 0.0f && y < 0.0f) - res = -M_PI + res; // 3rd quadrant - - return res; -} - - static void shapes_render_fragment(til_module_context_t *context, til_stream_t *stream, unsigned ticks, unsigned cpu, til_fb_fragment_t **fragment_ptr) { shapes_context_t *ctxt = (shapes_context_t *)context; @@ -337,7 +298,7 @@ static void shapes_render_fragment(til_module_context_t *context, til_stream_t * YYY = Y * Y; if (!radcache->initialized) { for (unsigned x = xstart; x < xend; x++, X++, XX += s) { - float a = rads[y * radcache->width + x] = atan2_approx(YY, XX); + float a = rads[y * radcache->width + x] = atan2f(YY, XX); if (YYY+X*X < r_sq * (1.f - fabsf(cosf(n_pinches * a + pinch)) * pinch_s)) til_fb_fragment_put_pixel_unchecked(fragment, TIL_FB_DRAW_FLAG_TEXTURABLE, x, y, 0xffffffff); /* TODO: stop relying on checked for clipping */ @@ -378,7 +339,7 @@ static void shapes_render_fragment(til_module_context_t *context, til_stream_t * YYYY = YY * YY; if (!radcache->initialized) { for (unsigned x = xstart; x < xend; x++, XX += s) { - float a = rads[y * radcache->width + x] = atan2_approx(YY, XX); + float a = rads[y * radcache->width + x] = atan2f(YY, XX); float r = cosf(n_points * (a + spin)) * .5f + .5f; r *= 1.f - fabsf(cosf(n_pinches * (a + pinch))) * pinch_s; @@ -426,7 +387,7 @@ static void shapes_render_fragment(til_module_context_t *context, til_stream_t * X = -(size >> 1) + xskip; if (!radcache->initialized) { for (unsigned x = xstart; x < xend; x++, X++, XX += s) { - float a = rads[y * radcache->width + x] = atan2_approx(YY, XX); + float a = rads[y * radcache->width + x] = atan2f(YY, XX); if (abs(Y) + abs(X) < r * (1.f - fabsf(cosf(n_pinches * a + pinch)) * pinch_s)) til_fb_fragment_put_pixel_unchecked(fragment, TIL_FB_DRAW_FLAG_TEXTURABLE, x, y, 0xffffffff); @@ -466,7 +427,7 @@ static void shapes_render_fragment(til_module_context_t *context, til_stream_t * YYYY = YY * YY; if (!radcache->initialized) { for (unsigned x = xstart; x < xend; x++, XX += s) { - float a = rads[y * radcache->width + x] = atan2_approx(YY, XX); + float a = rads[y * radcache->width + x] = atan2f(YY, XX); float r = (M_2_PI * asinf(sinf(n_points * (a + spin)) * .5f + .5f)) * .5f + .5f; /* ^^^^^^^^^^^^^^^^^^^ approximates a triangle wave */ -- cgit v1.2.3