[FFmpeg-devel] [PATCH] checkasm: add test for dcmul_add

flow gg hlefthleft at gmail.com
Sun Nov 19 00:28:10 EET 2023


From 2785ce57f68dbb2373c951b9432afa73796f7cc1 Mon Sep 17 00:00:00 2001
From: sunyuechi <sunyuechi at iscas.ac.cn>
Date: Sat, 18 Nov 2023 10:58:17 +0800
Subject: [PATCH] checkasm: test for dcmul_add

---
 tests/checkasm/af_afir.c | 141 +++++++++++++++++++++++++++------------
 1 file changed, 98 insertions(+), 43 deletions(-)

diff --git a/tests/checkasm/af_afir.c b/tests/checkasm/af_afir.c
index 08c55dacfc..6cb59dbb6c 100644
--- a/tests/checkasm/af_afir.c
+++ b/tests/checkasm/af_afir.c
@@ -33,64 +33,119 @@ do {                                          \
     int i;                                    \
     double bmg[2], stddev = 10.0, mean = 0.0; \
                                               \
-    for (i = 0; i < LEN*2+8; i += 2) {        \
+    for (i = 0; i < BUF_SIZE; i += 2) {        \
         av_bmg_get(&checkasm_lfg, bmg);       \
         buf[i]     = bmg[0] * stddev + mean;  \
         buf[i + 1] = bmg[1] * stddev + mean;  \
     }                                         \
 } while(0);

-static void test_fcmul_add(const float *src0, const float *src1, const float *src2)
+static void test_fcmul_add(AudioFIRDSPContext *fir)
 {
-    LOCAL_ALIGNED_32(float, cdst, [LEN*2+8]);
-    LOCAL_ALIGNED_32(float, odst, [LEN*2+8]);
-    int i;
-
-    declare_func(void, float *sum, const float *t, const float *c,
-                 ptrdiff_t len);
-
-    memcpy(cdst, src0, (LEN*2+8) * sizeof(float));
-    memcpy(odst, src0, (LEN*2+8) * sizeof(float));
-    call_ref(cdst, src1, src2, LEN);
-    call_new(odst, src1, src2, LEN);
-    for (i = 0; i <= LEN*2; i++) {
-        int idx = i & ~1;
-        float cre = src2[idx];
-        float cim = src2[idx + 1];
-        float tre = src1[idx];
-        float tim = src1[idx + 1];
-        double t = fabs(src0[i]) +
-                   fabs(tre) + fabs(tim) + fabs(cre) + fabs(cim) +
-                   fabs(tre * cre) + fabs(tim * cim) +
-                   fabs(tre * cim) + fabs(tim * cre) +
-                   fabs(tre * cre - tim * cim) +
-                   fabs(tre * cim + tim * cre) +
-                   fabs(cdst[i]) + 1.0;
-        if (!float_near_abs_eps(cdst[i], odst[i], t * 2 * FLT_EPSILON)) {
-            fprintf(stderr, "%d: %- .12f - %- .12f = % .12g\n",
-                    i, cdst[i], odst[i], cdst[i] - odst[i]);
-            fail();
-            break;
+#define BUF_SIZE LEN*2+8
+    LOCAL_ALIGNED_32(float, src0, [BUF_SIZE]);
+    LOCAL_ALIGNED_32(float, src1, [BUF_SIZE]);
+    LOCAL_ALIGNED_32(float, src2, [BUF_SIZE]);
+
+    randomize_buffer(src0);
+    randomize_buffer(src1);
+    randomize_buffer(src2);
+
+    if (check_func(fir->fcmul_add, "fcmul_add")) {
+        LOCAL_ALIGNED_32(float, cdst, [BUF_SIZE]);
+        LOCAL_ALIGNED_32(float, odst, [BUF_SIZE]);
+        int i;
+
+        declare_func(void, float *sum, const float *t, const float *c,
+                     ptrdiff_t len);
+
+        memcpy(cdst, src0, (BUF_SIZE) * sizeof(float));
+        memcpy(odst, src0, (BUF_SIZE) * sizeof(float));
+        call_ref(cdst, src1, src2, LEN);
+        call_new(odst, src1, src2, LEN);
+        for (i = 0; i <= LEN*2; i++) {
+            int idx = i & ~1;
+            float cre = src2[idx];
+            float cim = src2[idx + 1];
+            float tre = src1[idx];
+            float tim = src1[idx + 1];
+            double t = fabs(src0[i]) +
+                       fabs(tre) + fabs(tim) + fabs(cre) + fabs(cim) +
+                       fabs(tre * cre) + fabs(tim * cim) +
+                       fabs(tre * cim) + fabs(tim * cre) +
+                       fabs(tre * cre - tim * cim) +
+                       fabs(tre * cim + tim * cre) +
+                       fabs(cdst[i]) + 1.0;
+            if (!float_near_abs_eps(cdst[i], odst[i], t * 2 * FLT_EPSILON)) {
+                fprintf(stderr, "%d: %- .12f - %- .12f = % .12g\n",
+                        i, cdst[i], odst[i], cdst[i] - odst[i]);
+                fail();
+                break;
+            }
         }
+        memcpy(odst, src0, (BUF_SIZE) * sizeof(float));
+        bench_new(odst, src1, src2, LEN);
     }
-    memcpy(odst, src0, (LEN*2+8) * sizeof(float));
-    bench_new(odst, src1, src2, LEN);
+
+    report("fcmul_add");
 }

-void checkasm_check_afir(void)
+static void test_dcmul_add(AudioFIRDSPContext *fir)
 {
-    LOCAL_ALIGNED_32(float, src0, [LEN*2+8]);
-    LOCAL_ALIGNED_32(float, src1, [LEN*2+8]);
-    LOCAL_ALIGNED_32(float, src2, [LEN*2+8]);
-    AudioFIRDSPContext fir = { 0 };
-
-    ff_afir_init(&fir);
+#define BUF_SIZE LEN*2+8
+    LOCAL_ALIGNED_32(double, src0, [BUF_SIZE]);
+    LOCAL_ALIGNED_32(double, src1, [BUF_SIZE]);
+    LOCAL_ALIGNED_32(double, src2, [BUF_SIZE]);

     randomize_buffer(src0);
     randomize_buffer(src1);
     randomize_buffer(src2);

-    if (check_func(fir.fcmul_add, "fcmul_add"))
-        test_fcmul_add(src0, src1, src2);
-    report("fcmul_add");
+    if (check_func(fir->dcmul_add, "dcmul_add")) {
+        LOCAL_ALIGNED_32(double, cdst, [BUF_SIZE]);
+        LOCAL_ALIGNED_32(double, odst, [BUF_SIZE]);
+        int i;
+
+        declare_func(void, double *sum, const double *t, const double *c,
+                     ptrdiff_t len);
+
+        memcpy(cdst, src0, (BUF_SIZE) * sizeof(double));
+        memcpy(odst, src0, (BUF_SIZE) * sizeof(double));
+        call_ref(cdst, src1, src2, LEN);
+        call_new(odst, src1, src2, LEN);
+        for (i = 0; i <= LEN*2; i++) {
+            int idx = i & ~1;
+            double cre = src2[idx];
+            double cim = src2[idx + 1];
+            double tre = src1[idx];
+            double tim = src1[idx + 1];
+            double t = fabs(src0[i]) +
+                       fabs(tre) + fabs(tim) + fabs(cre) + fabs(cim) +
+                       fabs(tre * cre) + fabs(tim * cim) +
+                       fabs(tre * cim) + fabs(tim * cre) +
+                       fabs(tre * cre - tim * cim) +
+                       fabs(tre * cim + tim * cre) +
+                       fabs(cdst[i]) + 1.0;
+            if (!double_near_abs_eps(cdst[i], odst[i], t * 2 * FLT_EPSILON)) {
+                fprintf(stderr, "%d: %- .12f - %- .12f = % .12g\n",
+                        i, cdst[i], odst[i], cdst[i] - odst[i]);
+                fail();
+                break;
+            }
+        }
+        memcpy(odst, src0, (BUF_SIZE) * sizeof(double));
+        bench_new(odst, src1, src2, LEN);
+    }
+
+    report("dcmul_add");
+}
+
+
+void checkasm_check_afir(void)
+{
+    AudioFIRDSPContext fir = { 0 };
+
+    ff_afir_init(&fir);
+    test_fcmul_add(&fir);
+    test_dcmul_add(&fir);
 }
-- 
2.42.1


flow gg <hlefthleft at gmail.com> 于2023年11月18日周六 11:21写道:

>
>


More information about the ffmpeg-devel mailing list