From 9ba266c21f08139281fd7578d751bed59a2006cb Mon Sep 17 00:00:00 2001
From: Ingo Weyrich <heckflosse67@gmx.de>
Date: Thu, 25 Feb 2021 22:44:50 +0100
Subject: [PATCH 1/6] added some stopwatches

---
 rtengine/ipwavelet.cc | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/rtengine/ipwavelet.cc b/rtengine/ipwavelet.cc
index 4b65dd5bc..eb715f166 100644
--- a/rtengine/ipwavelet.cc
+++ b/rtengine/ipwavelet.cc
@@ -2196,13 +2196,15 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
         
         
     if (thrend > 0.f) {
+        StopWatch Stop0("final touchup");
             //2 decomposition LL after guidefilter and dst before (perhaps dst no need)
         const std::unique_ptr<wavelet_decomposition> LdecompLL(new wavelet_decomposition(LL[0], ww, hh, levwavL, 1, skip, rtengine::max(1, wavNestedLevels), DaubLen));
         const std::unique_ptr<wavelet_decomposition> Ldecompdst(new wavelet_decomposition(dst->L[0], ww, hh, levwavL, 1, skip, rtengine::max(1, wavNestedLevels), DaubLen));
         if (!LdecompLL->memory_allocation_failed() && !Ldecompdst->memory_allocation_failed()) {
-
+            StopWatch Stop1("Evaluate2");
             Evaluate2(*LdecompLL, meang, meanNg, sigmag, sigmaNg, MaxPg, MaxNg, wavNestedLevels);
             Evaluate2(*Ldecompdst, mean, meanN, sigma, sigmaN, MaxP, MaxN, wavNestedLevels);
+            Stop1.stop();
             float sig = 2.f;
             float thr = 0.f;
             if(thrend < 0.02f) thr = 0.5f;
@@ -2214,6 +2216,7 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
                 0, 1, 0.35, 0.35,thrend, 1.0, 0.35, 0.35, thrend + 0.01f, thr, 0.35, 0.35, 1, thr, 0.35, 0.35
             });
 
+            StopWatch Stop2("level loops");
             for (int dir = 1; dir < 4; dir++) {
                 for (int level = 0; level < levwavL-1; level++) {
                     int Wlvl_L = LdecompLL->level_W(level);
@@ -2281,6 +2284,7 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
                     }
                 }
             }
+            Stop2.stop();
             LdecompLL->reconstruct(LL[0], cp.strength);
         }
     }

From 10e0ab4eaaa784ec86437aae00d88d030d4ecea9 Mon Sep 17 00:00:00 2001
From: Ingo Weyrich <heckflosse67@gmx.de>
Date: Thu, 25 Feb 2021 23:10:37 +0100
Subject: [PATCH 2/6] Speedup final touchup local contrast

---
 rtengine/ipwavelet.cc | 86 +++++++++++++++++++------------------------
 1 file changed, 38 insertions(+), 48 deletions(-)

diff --git a/rtengine/ipwavelet.cc b/rtengine/ipwavelet.cc
index eb715f166..3caa9a001 100644
--- a/rtengine/ipwavelet.cc
+++ b/rtengine/ipwavelet.cc
@@ -2196,19 +2196,19 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
         
         
     if (thrend > 0.f) {
-        StopWatch Stop0("final touchup");
-            //2 decomposition LL after guidefilter and dst before (perhaps dst no need)
+        StopWatch Stop0("Final touchup");
+        //2 decomposition LL after guidefilter and dst before (perhaps dst no need)
         const std::unique_ptr<wavelet_decomposition> LdecompLL(new wavelet_decomposition(LL[0], ww, hh, levwavL, 1, skip, rtengine::max(1, wavNestedLevels), DaubLen));
         const std::unique_ptr<wavelet_decomposition> Ldecompdst(new wavelet_decomposition(dst->L[0], ww, hh, levwavL, 1, skip, rtengine::max(1, wavNestedLevels), DaubLen));
         if (!LdecompLL->memory_allocation_failed() && !Ldecompdst->memory_allocation_failed()) {
-            StopWatch Stop1("Evaluate2");
+StopWatch Stop1("evaluate");
             Evaluate2(*LdecompLL, meang, meanNg, sigmag, sigmaNg, MaxPg, MaxNg, wavNestedLevels);
             Evaluate2(*Ldecompdst, mean, meanN, sigma, sigmaN, MaxP, MaxN, wavNestedLevels);
-            Stop1.stop();
-            float sig = 2.f;
+Stop1.stop();
+            constexpr float sig = 2.f;
             float thr = 0.f;
-            if(thrend < 0.02f) thr = 0.5f;
-            else if(thrend < 0.1f) thr = 0.2f;
+            if (thrend < 0.02f) thr = 0.5f;
+            else if (thrend < 0.1f) thr = 0.2f;
             else thr = 0.f;
 
             FlatCurve wavguid({
@@ -2219,34 +2219,29 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
             StopWatch Stop2("level loops");
             for (int dir = 1; dir < 4; dir++) {
                 for (int level = 0; level < levwavL-1; level++) {
-                    int Wlvl_L = LdecompLL->level_W(level);
-                    int Hlvl_L = LdecompLL->level_H(level);
+                    const int Wlvl_L = LdecompLL->level_W(level);
+                    const int Hlvl_L = LdecompLL->level_H(level);
                     float* const* WavCoeffs_L = LdecompLL->level_coeffs(level);//first decomp denoised
                     float* const* WavCoeffs_L2 = Ldecompdst->level_coeffs(level);//second decomp before denoise
                     if (settings->verbose) {
                         printf("level=%i mean=%.0f meanden=%.0f sigma=%.0f  sigmaden=%.0f Max=%.0f Maxden=%.0f\n", level, mean[level], meang[level], sigma[level], sigmag[level],MaxP[level], MaxPg[level]);
                     }
 
-                                            //find local contrast
-                    float tempmean = 0.f;
-                    float tempsig = 0.f;
-                    float tempmax = 0.f;
-                    tempmean = 0.3f * mean[level] + 0.7f * meang[level] ;
-                    tempsig = 0.3f * sigma[level] + 0.7f * sigmag[level] ;
-                    tempmax = 0.3f * MaxP[level] + 0.7f * MaxPg[level] ;
+                    //find local contrast
+                    const float tempmean = 0.3f * mean[level] + 0.7f * meang[level];
+                    const float tempsig = 0.3f * sigma[level] + 0.7f * sigmag[level];
+                    const float tempmax = 0.3f * MaxP[level] + 0.7f * MaxPg[level];
                                             
                     if (MaxP[level] > 0.f && mean[level] != 0.f && sigma[level] != 0.f) { //curve
-                        float insigma = 0.666f; //SD
-                        float logmax = log(tempmax); //log Max
-                                                //cp.sigmm change the "wider" of sigma
-                        float rapX = (tempmean + sig * tempsig) / (tempmax); //rapport between sD / max
-                        float inx = log(insigma);
-                        float iny = log(rapX);
-                        float rap = inx / iny; //koef
-                        float asig = 0.166f / (tempsig * sig);
-                        float bsig = 0.5f - asig * tempmean;
-                        float amean = 0.5f / (tempmean);
-                    
+                        constexpr float insigma = 0.666f; //SD
+                        const float logmax = log(tempmax); //log Max
+                        const float rapX = (tempmean + sig * tempsig) / tempmax; //rapport between sD / max
+                        constexpr float inx = log(insigma);
+                        const float iny = log(rapX);
+                        const float rap = inx / iny; //koef
+                        const float asig = 0.166f / (tempsig * sig);
+                        const float bsig = 0.5f - asig * tempmean;
+                        const float amean = 1.f / tempmean;
 
 #ifdef _OPENMP
         #pragma omp parallel for schedule(dynamic, Wlvl_L * 16) num_threads(wavNestedLevels) if (wavNestedLevels>1)
@@ -2254,32 +2249,27 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
 
                         for (int i = 0; i < Wlvl_L * Hlvl_L; i++) {
                             float absciss;
-                            float tempwav = 0.f;
-                            tempwav = 0.7f * WavCoeffs_L[dir][i] + 0.3f * WavCoeffs_L2[dir][i];
+                            const float tempwav = std::fabs(0.7f * WavCoeffs_L[dir][i] + 0.3f * WavCoeffs_L2[dir][i]);
 
-                            if (std::fabs(tempwav) >= (tempmean + sig * tempsig)) { //for max
-                                float valcour = xlogf(std::fabs(tempwav));
-                                float valc = valcour - logmax;
-                                float vald = valc * rap;
+                            if (tempwav >= tempmean + sig * tempsig) { //for max
+                                const float vald = (xlogf(tempwav) - logmax) * rap;
                                 absciss = xexpf(vald);
-                            } else if (std::fabs(tempwav) >= tempmean) {
-                                absciss = asig * std::fabs(tempwav) + bsig;
+                            } else if (tempwav >= tempmean) {
+                                absciss = asig * tempwav + bsig;
                             } else {
-                                absciss = amean * std::fabs(tempwav);
-                                float abs = pow(2.f * absciss, (1.f / SQR(sig)));
-                                absciss = 0.5f * abs;
+                                absciss = amean * tempwav;
+                                if (sig == 2.f) { // for sig = 2.f we can use a faster calculation because the exponent in this case is 0.25
+                                    absciss = 0.5f * std::sqrt(std::sqrt(absciss));
+                                } else {
+                                    absciss = 0.5f * pow_F(absciss, 1.f / SQR(sig));
+                                }
                             }
-                            float kc = wavguid.getVal(absciss) -1.f;
+                            float kc = wavguid.getVal(absciss) - 1.f;
+                            kc = kc < 0.f ? -SQR(kc) : kc; // approximation to simulate sliders denoise
 
-                            if(kc < 0) {
-                                kc = -SQR(kc);//approximation to simulate sliders denoise
-                            }
-                            float reduceeffect = kc <= 0.f ? 1.f : 1.2f;//1.2 allows to increase denoise (not used)
-
-                            float kinterm = 1.f + reduceeffect * kc;
-                            kinterm = kinterm <= 0.f ? 0.01f : kinterm;
-                            float prov = WavCoeffs_L2[dir][i];//save before denoise
-                            WavCoeffs_L[dir][i] = prov + (WavCoeffs_L[dir][i] - prov) * kinterm;//only apply local contrast on difference between denoise and normal
+                            const float reduceeffect = kc <= 0.f ? 1.f : 1.2f;//1.2 allows to increase denoise (not used)
+                            const float kinterm = rtengine::max(1.f + reduceeffect * kc, 0.f);
+                            WavCoeffs_L[dir][i] = intp(kinterm, WavCoeffs_L[dir][i], WavCoeffs_L2[dir][i]); // interpolate using kinterm
                         }
                     }
                 }

From d7327e8b05498b02be5bcef84962ea7d96e1c61f Mon Sep 17 00:00:00 2001
From: Ingo Weyrich <heckflosse67@gmx.de>
Date: Fri, 26 Feb 2021 12:41:23 +0100
Subject: [PATCH 3/6] left original code in comments

---
 rtengine/ipwavelet.cc | 20 ++++++++++++--------
 1 file changed, 12 insertions(+), 8 deletions(-)

diff --git a/rtengine/ipwavelet.cc b/rtengine/ipwavelet.cc
index 3caa9a001..1c53992b6 100644
--- a/rtengine/ipwavelet.cc
+++ b/rtengine/ipwavelet.cc
@@ -2196,16 +2196,19 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
         
         
     if (thrend > 0.f) {
-        StopWatch Stop0("Final touchup");
         //2 decomposition LL after guidefilter and dst before (perhaps dst no need)
         const std::unique_ptr<wavelet_decomposition> LdecompLL(new wavelet_decomposition(LL[0], ww, hh, levwavL, 1, skip, rtengine::max(1, wavNestedLevels), DaubLen));
         const std::unique_ptr<wavelet_decomposition> Ldecompdst(new wavelet_decomposition(dst->L[0], ww, hh, levwavL, 1, skip, rtengine::max(1, wavNestedLevels), DaubLen));
         if (!LdecompLL->memory_allocation_failed() && !Ldecompdst->memory_allocation_failed()) {
-StopWatch Stop1("evaluate");
             Evaluate2(*LdecompLL, meang, meanNg, sigmag, sigmaNg, MaxPg, MaxNg, wavNestedLevels);
             Evaluate2(*Ldecompdst, mean, meanN, sigma, sigmaN, MaxP, MaxN, wavNestedLevels);
-Stop1.stop();
             constexpr float sig = 2.f;
+            /* original code for variable sig
+            float k = sig;
+            if (sig > 1.f) {
+                k = SQR(sig);
+            }
+            */
             float thr = 0.f;
             if (thrend < 0.02f) thr = 0.5f;
             else if (thrend < 0.1f) thr = 0.2f;
@@ -2216,7 +2219,6 @@ Stop1.stop();
                 0, 1, 0.35, 0.35,thrend, 1.0, 0.35, 0.35, thrend + 0.01f, thr, 0.35, 0.35, 1, thr, 0.35, 0.35
             });
 
-            StopWatch Stop2("level loops");
             for (int dir = 1; dir < 4; dir++) {
                 for (int level = 0; level < levwavL-1; level++) {
                     const int Wlvl_L = LdecompLL->level_W(level);
@@ -2258,11 +2260,15 @@ Stop1.stop();
                                 absciss = asig * tempwav + bsig;
                             } else {
                                 absciss = amean * tempwav;
+                                /*
                                 if (sig == 2.f) { // for sig = 2.f we can use a faster calculation because the exponent in this case is 0.25
-                                    absciss = 0.5f * std::sqrt(std::sqrt(absciss));
+                                */
+                                absciss = 0.5f * std::sqrt(std::sqrt(absciss));
+                                /* original code for variable sig
                                 } else {
-                                    absciss = 0.5f * pow_F(absciss, 1.f / SQR(sig));
+                                    absciss = 0.5f * pow_F(absciss, 1.f / k);
                                 }
+                                */
                             }
                             float kc = wavguid.getVal(absciss) - 1.f;
                             kc = kc < 0.f ? -SQR(kc) : kc; // approximation to simulate sliders denoise
@@ -2274,12 +2280,10 @@ Stop1.stop();
                     }
                 }
             }
-            Stop2.stop();
             LdecompLL->reconstruct(LL[0], cp.strength);
         }
     }
 
-        
         //end local contrast
 #ifdef _OPENMP
         #pragma omp parallel for

From d3c536b0d8711ba62eeb23cac66fed718f9a3e5c Mon Sep 17 00:00:00 2001
From: Ingo Weyrich <heckflosse67@gmx.de>
Date: Fri, 26 Feb 2021 13:01:02 +0100
Subject: [PATCH 4/6] Fix clang build

---
 rtengine/ipwavelet.cc | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/rtengine/ipwavelet.cc b/rtengine/ipwavelet.cc
index 1c53992b6..07610d0d9 100644
--- a/rtengine/ipwavelet.cc
+++ b/rtengine/ipwavelet.cc
@@ -2238,7 +2238,7 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
                         constexpr float insigma = 0.666f; //SD
                         const float logmax = log(tempmax); //log Max
                         const float rapX = (tempmean + sig * tempsig) / tempmax; //rapport between sD / max
-                        constexpr float inx = log(insigma);
+                        const float inx = log(insigma);
                         const float iny = log(rapX);
                         const float rap = inx / iny; //koef
                         const float asig = 0.166f / (tempsig * sig);

From fb72b6c62678118e0b88922c578a54afe7d6d1b1 Mon Sep 17 00:00:00 2001
From: Ingo Weyrich <heckflosse67@gmx.de>
Date: Fri, 26 Feb 2021 13:47:08 +0100
Subject: [PATCH 5/6] Keep original code, Optimizer will catch that

---
 rtengine/ipwavelet.cc | 13 +++++--------
 1 file changed, 5 insertions(+), 8 deletions(-)

diff --git a/rtengine/ipwavelet.cc b/rtengine/ipwavelet.cc
index 07610d0d9..fe172c001 100644
--- a/rtengine/ipwavelet.cc
+++ b/rtengine/ipwavelet.cc
@@ -2203,12 +2203,13 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
             Evaluate2(*LdecompLL, meang, meanNg, sigmag, sigmaNg, MaxPg, MaxNg, wavNestedLevels);
             Evaluate2(*Ldecompdst, mean, meanN, sigma, sigmaN, MaxP, MaxN, wavNestedLevels);
             constexpr float sig = 2.f;
-            /* original code for variable sig
+
+            // original code for variable sig
             float k = sig;
             if (sig > 1.f) {
                 k = SQR(sig);
             }
-            */
+
             float thr = 0.f;
             if (thrend < 0.02f) thr = 0.5f;
             else if (thrend < 0.1f) thr = 0.2f;
@@ -2260,15 +2261,11 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
                                 absciss = asig * tempwav + bsig;
                             } else {
                                 absciss = amean * tempwav;
-                                /*
                                 if (sig == 2.f) { // for sig = 2.f we can use a faster calculation because the exponent in this case is 0.25
-                                */
-                                absciss = 0.5f * std::sqrt(std::sqrt(absciss));
-                                /* original code for variable sig
-                                } else {
+                                    absciss = 0.5f * std::sqrt(std::sqrt(absciss));
+                                } else { // original code for variable sig
                                     absciss = 0.5f * pow_F(absciss, 1.f / k);
                                 }
-                                */
                             }
                             float kc = wavguid.getVal(absciss) - 1.f;
                             kc = kc < 0.f ? -SQR(kc) : kc; // approximation to simulate sliders denoise

From 4f880b346a28fbcebf4788568f2c3506c6f3b98f Mon Sep 17 00:00:00 2001
From: Ingo Weyrich <heckflosse67@gmx.de>
Date: Fri, 26 Feb 2021 14:19:52 +0100
Subject: [PATCH 6/6] add a cppcheck-suppress

---
 rtengine/ipwavelet.cc | 1 +
 1 file changed, 1 insertion(+)

diff --git a/rtengine/ipwavelet.cc b/rtengine/ipwavelet.cc
index fe172c001..3eeba7a82 100644
--- a/rtengine/ipwavelet.cc
+++ b/rtengine/ipwavelet.cc
@@ -2206,6 +2206,7 @@ void ImProcFunctions::ip_wavelet(LabImage * lab, LabImage * dst, int kall, const
 
             // original code for variable sig
             float k = sig;
+            // cppcheck-suppress knownConditionTrueFalse
             if (sig > 1.f) {
                 k = SQR(sig);
             }