shithub: opus

Download patch

ref: d4b04d3275af9938c92a386fc9178977f293362c
parent: b2cfd87783713793f4a170bb5a13a1470896436e
author: Jean-Marc Valin <jmvalin@amazon.com>
date: Fri Nov 17 18:10:59 EST 2023

Speed up silk_warped_autocorrelation_FLP()

Reducing the dependency chain between tmp1 and tmp2 at the
cost of an extra multiply.

--- a/silk/float/warped_autocorrelation_FLP.c
+++ b/silk/float/warped_autocorrelation_FLP.c
@@ -54,11 +54,13 @@
         /* Loop over allpass sections */
         for( i = 0; i < order; i += 2 ) {
             /* Output of allpass section */
-            tmp2 = state[ i ] + warping * ( state[ i + 1 ] - tmp1 );
+            /* We voluntarily use two multiples instead of factoring the expression to
+               reduce the length of the dependency chain (tmp1->tmp2->tmp1... ). */
+            tmp2 = state[ i ] + warping * state[ i + 1 ] - warping * tmp1;
             state[ i ] = tmp1;
             C[ i ] += state[ 0 ] * tmp1;
             /* Output of allpass section */
-            tmp1 = state[ i + 1 ] + warping * ( state[ i + 2 ] - tmp2 );
+            tmp1 = state[ i + 1 ] + warping * state[ i + 2 ] - warping * tmp2;
             state[ i + 1 ] = tmp2;
             C[ i + 1 ] += state[ 0 ] * tmp2;
         }
--