From 04ee0b66720b245b10c007e192da8fabf997c9bc Mon Sep 17 00:00:00 2001 From: Christophe Favergeon <48906714+christophe0606@users.noreply.github.com> Date: Fri, 24 Jan 2025 08:00:09 +0100 Subject: [PATCH] Github action for testing Neon code New github action Tuning of the tests Update of test CMakeLists.txt --- .github/workflows/runneontest.yaml | 118 +++ Include/dsp/matrix_utils.h | 89 +- Ne10/CMSIS_NE10_fft.neonintrinsic.h | 12 +- Ne10/CMSIS_NE10_fft.neonintrinsic_f16.h | 8 +- Ne10/CMSIS_NE10_fft_common_variables.h | 40 +- ...IS_NE10_fft_generic_float16.neonintrisic.c | 20 +- ...IS_NE10_fft_generic_float32.neonintrisic.c | 20 +- Ne10/NE10_fft_float32.neonintrinsic.c | 8 +- Ne10/NE10_rfft_float16.neonintrinsic.c | 4 +- Ne10/NE10_rfft_float32.neonintrinsic.c | 4 +- README.md | 2 + .../arm_canberra_distance_f16.c | 2 +- Source/DistanceFunctions/arm_dice_distance.c | 2 +- .../DistanceFunctions/arm_hamming_distance.c | 2 +- .../DistanceFunctions/arm_jaccard_distance.c | 2 +- .../arm_kulsinski_distance.c | 2 +- .../arm_rogerstanimoto_distance.c | 2 +- .../arm_sokalmichener_distance.c | 4 +- .../arm_sokalsneath_distance.c | 2 +- Source/DistanceFunctions/arm_yule_distance.c | 2 +- Source/FastMathFunctions/arm_atan2_f16.c | 4 +- Source/FastMathFunctions/arm_vlog_f16.c | 18 +- Source/FilteringFunctions/Config.cmake | 2 + .../arm_biquad_cascade_df2T_f32.c | 4 +- Source/MatrixFunctions/arm_mat_cholesky_f16.c | 2 +- Source/MatrixFunctions/arm_mat_qr_f16.c | 14 +- .../arm_mat_solve_lower_triangular_f16.c | 2 +- .../arm_mat_solve_upper_triangular_f16.c | 2 +- Source/MatrixFunctions/arm_mat_vec_mult_f16.c | 10 +- Source/StatisticsFunctions/arm_absmax_f16.c | 2 +- .../arm_absmax_no_idx_f16.c | 2 +- Source/StatisticsFunctions/arm_absmin_f16.c | 2 +- .../arm_absmin_no_idx_f16.c | 2 +- .../StatisticsFunctions/arm_accumulate_f16.c | 2 +- Source/StatisticsFunctions/arm_mean_f16.c | 2 +- Source/SupportFunctions/arm_barycenter_f16.c | 2 +- Testing/CMakeLists.txt | 108 ++- Testing/FrameworkInclude/Error.h | 21 +- Testing/FrameworkInclude/FPGA.h | 6 +- Testing/FrameworkInclude/Test.h | 12 +- Testing/FrameworkInclude/Timing.h | 1 + Testing/FrameworkSource/FPGA.cpp | 8 +- Testing/PatternGeneration/BIQUAD.py | 9 +- .../BIQUAD/BIQUADF32/AllBiquadCoefs2_f32.txt | 792 +++++++++--------- .../BIQUAD/BIQUADF32/AllBiquadInputs2_f32.txt | 236 +++--- .../BIQUAD/BIQUADF32/AllBiquadRefs2_f32.txt | 260 +++--- .../BIQUADF32/AllBiquadStereoInputs2_f32.txt | 484 +++++------ .../BIQUADF32/AllBiquadStereoRefs2_f32.txt | 524 ++++++------ .../BIQUAD/BIQUADF32/BiquadInput1_f32.txt | 400 ++++----- .../BIQUAD/BIQUADF32/BiquadOutput1_f32.txt | 400 ++++----- Testing/Source/Tests/BIQUADF32.cpp | 25 +- Testing/Source/Tests/BasicTestsF32.cpp | 2 +- Testing/Source/Tests/FastMathF16.cpp | 2 +- Testing/Source/Tests/TransformRF16.cpp | 4 +- Testing/Source/Tests/UnaryTestsF32.cpp | 2 +- Testing/TestScripts/CodeGen.py | 2 +- Testing/processResult.py | 7 +- Testing/testmain.cpp | 2 +- vcpkg-neon-configuration.json | 14 + 59 files changed, 1978 insertions(+), 1760 deletions(-) create mode 100644 .github/workflows/runneontest.yaml create mode 100644 vcpkg-neon-configuration.json diff --git a/.github/workflows/runneontest.yaml b/.github/workflows/runneontest.yaml new file mode 100644 index 000000000..a57ec1ac6 --- /dev/null +++ b/.github/workflows/runneontest.yaml @@ -0,0 +1,118 @@ +name: Neon tests +on: + workflow_dispatch: + pull_request: + branches: [main] + push: + branches: [main] + +permissions: + actions: read + security-events: write + +jobs: + CI_test_run: + runs-on: ubuntu-22.04-arm + + steps: + - name: Checkout + uses: actions/checkout@v4 + + - name: Setup Python 3.10 + uses: actions/setup-python@v5 + with: + python-version: '3.10' + + - name: Install system packages + run: | + sudo add-apt-repository ppa:deadsnakes/ppa + sudo apt-get install libpython3.9 libtinfo5 + sudo apt install build-essential + sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-11 60 --slave /usr/bin/g++ g++ /usr/bin/g++-11 + sudo update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-12 40 --slave /usr/bin/g++ g++ /usr/bin/g++-12 + sudo update-alternatives --set gcc /usr/bin/gcc-12 + + + - name: Activate vcpkg + uses: ARM-software/cmsis-actions/vcpkg@v1 + with: + config: "./vcpkg-neon-configuration.json" + + - name: Prepare framework + run: | + cd Testing + echo "Create missing folders" + mkdir FullBenchmark + mkdir Output + mkdir GeneratedInclude + mkdir GeneratedSource + mkdir GeneratedIncludeBench + mkdir GeneratedSourceBench + mkdir build + + echo "Install missing python packages" + pip install -r requirements.txt + + echo "Preprocess test description" + python preprocess.py -f desc.txt -o Output.pickle + python preprocess.py -f desc_neon.txt -o Output_neon.pickle + python preprocess.py -f desc_f16.txt -o Output_f16.pickle + + echo "Generate missing CPP headers" + python processTests.py -gen . -p Patterns -d Parameters -f Output.pickle -e + python processTests.py -gen . -p Patterns -d Parameters -f Output_neon.pickle -e + python processTests.py -gen . -p Patterns -d Parameters -f Output_f16.pickle -e + + cd build + + cmake -G "Ninja" .. + +# - name: Setup tmate session +# uses: mxschmitt/action-tmate@v3 + + - name: Execute generic tests + run: | + cd Testing/build + + python ../processTests.py -p ../Patterns -d ../Parameters -gen .. -e -f ../Output.pickle + ninja + ./test > result.txt + python ../processResult.py --noerr -e -f ../Output.pickle -r result.txt -html > result.html + + - name: Execute neon specific C tests + run: | + cd Testing/build + + python ../processTests.py -p ../Patterns -d ../Parameters -gen .. -e -f ../Output_neon.pickle + ninja + ./test > result_neon.txt + python ../processResult.py --noerr -e -f ../Output_neon.pickle -r result_neon.txt -html > result_neon.html + + - name: Execute f16 C tests + run: | + cd Testing/build + + python ../processTests.py -p ../Patterns -d ../Parameters -gen .. -e -f ../Output_f16.pickle + ninja + ./test > result_f16.txt + python ../processResult.py --noerr -e -f ../Output_f16.pickle -r result_f16.txt -html > result_f16.html + + - name: Upload test report + uses: actions/upload-artifact@v4 + with: + name: neon-test-report + path: | + Testing/build/result.html + Testing/build/result_neon.html + Testing/build/result_f16.html + + + - name: Check error + run: | + cd Testing/build + + echo "Checking output..." + test "$(grep "FAILED" result.html | wc -l)" -eq 0 + test "$(grep "FAILED" result_neon.html | wc -l)" -eq 0 + test "$(grep "FAILED" result_f16.html | wc -l)" -eq 0 + diff --git a/Include/dsp/matrix_utils.h b/Include/dsp/matrix_utils.h index 79e7f8cf1..c8d0ba3e4 100755 --- a/Include/dsp/matrix_utils.h +++ b/Include/dsp/matrix_utils.h @@ -51,7 +51,7 @@ extern "C" \ for(_w=0;_w < nb; _w++) \ { \ - *data *= CAST v; \ + *data = CAST *data * CAST v; \ data += _numCols; \ } \ } @@ -178,54 +178,63 @@ extern "C" } \ } -#define SCALE_ROW_F16(A,COL,v,i) \ -{ \ +#define SCALE_ROW_F16(A,COL,v,i) \ +{ \ int32_t _w; \ - float16_t *data = (A)->pData; \ + float16_t *data = (A)->pData; \ const int32_t _numCols = (A)->numCols;\ const int32_t nb = _numCols-(COL); \ - \ + \ data += i*_numCols + (COL); \ - \ - for(_w=0;_w < nb; _w++) \ - { \ - *data++ *= (_Float16)v; \ - } \ + \ + _Float16 sum; \ + for(_w=0;_w < nb; _w++) \ + { \ + sum = *data; \ + sum *= (_Float16)v; \ + *data++ = sum; \ + } \ } -#define MAC_ROW_F16(COL,A,i,v,B,j) \ -{ \ - int32_t _w; \ - float16_t *dataA = (A)->pData; \ - float16_t *dataB = (B)->pData; \ - const int32_t _numCols = (A)->numCols; \ - const int32_t nb = _numCols-(COL); \ - \ - dataA += i*_numCols + (COL); \ - dataB += j*_numCols + (COL); \ - \ - for(_w=0;_w < nb; _w++) \ - { \ - *dataA++ += (_Float16)v * (_Float16)*dataB++;\ - } \ +#define MAC_ROW_F16(COL,A,i,v,B,j) \ +{ \ + int32_t _w; \ + float16_t *dataA = (A)->pData; \ + float16_t *dataB = (B)->pData; \ + const int32_t _numCols = (A)->numCols; \ + const int32_t nb = _numCols-(COL); \ + \ + dataA += i*_numCols + (COL); \ + dataB += j*_numCols + (COL); \ + \ + _Float16 sum ; \ + for(_w=0;_w < nb; _w++) \ + { \ + sum = *dataA; \ + sum += (_Float16)v * (_Float16)*dataB++;\ + *dataA++ = sum; \ + } \ } -#define MAS_ROW_F16(COL,A,i,v,B,j) \ -{ \ - int32_t _w; \ - float16_t *dataA = (A)->pData; \ - float16_t *dataB = (B)->pData; \ - const int32_t _numCols = (A)->numCols; \ - const int32_t nb = _numCols-(COL); \ - \ - dataA += i*_numCols + (COL); \ - dataB += j*_numCols + (COL); \ - \ - for(_w=0;_w < nb; _w++) \ - { \ - *dataA++ -= (_Float16)v * (_Float16)*dataB++;\ - } \ +#define MAS_ROW_F16(COL,A,i,v,B,j) \ +{ \ + int32_t _w; \ + float16_t *dataA = (A)->pData; \ + float16_t *dataB = (B)->pData; \ + const int32_t _numCols = (A)->numCols; \ + const int32_t nb = _numCols-(COL); \ + \ + dataA += i*_numCols + (COL); \ + dataB += j*_numCols + (COL); \ + \ + _Float16 sum ; \ + for(_w=0;_w < nb; _w++) \ + { \ + sum = *dataA; \ + sum -= (_Float16)v * (_Float16)*dataB++;\ + *dataA++ = sum; \ + } \ } #endif /*defined(ARM_MATH_MVE_FLOAT16) && !defined(ARM_MATH_AUTOVECTORIZE)*/ diff --git a/Ne10/CMSIS_NE10_fft.neonintrinsic.h b/Ne10/CMSIS_NE10_fft.neonintrinsic.h index 03680c00b..5b8b75ec8 100755 --- a/Ne10/CMSIS_NE10_fft.neonintrinsic.h +++ b/Ne10/CMSIS_NE10_fft.neonintrinsic.h @@ -110,17 +110,17 @@ #define VDUPQ_N_F32(VAR) { VAR, VAR, VAR, VAR } -#define CONST_TW_81 0.70710678 -#define CONST_TW_81N -0.70710678 +#define CONST_TW_81 0.70710678f +#define CONST_TW_81N -0.70710678f -const static float32x4_t Q_TW_81 = VDUPQ_N_F32(CONST_TW_81 ); -const static float32x4_t Q_TW_81N = VDUPQ_N_F32(CONST_TW_81N); +static const float32x4_t Q_TW_81 = VDUPQ_N_F32(CONST_TW_81 ); +static const float32x4_t Q_TW_81N = VDUPQ_N_F32(CONST_TW_81N); #define DIV_TW81 1.4142136f #define DIV_TW81N -1.4142136f -const static float32x4_t DIV_TW81_NEON = VDUPQ_N_F32(DIV_TW81); -const static float32x4_t DIV_TW81N_NEON = VDUPQ_N_F32(DIV_TW81N); +static const float32x4_t DIV_TW81_NEON = VDUPQ_N_F32(DIV_TW81); +static const float32x4_t DIV_TW81N_NEON = VDUPQ_N_F32(DIV_TW81N); #define NE10_RADIX8x4_R2C_NEON_KERNEL_S1(Q_OUT,Q_IN) do { \ Q_OUT ## 0 = vaddq_f32 (Q_IN ## 0, Q_IN ## 4); \ diff --git a/Ne10/CMSIS_NE10_fft.neonintrinsic_f16.h b/Ne10/CMSIS_NE10_fft.neonintrinsic_f16.h index 328734943..d5c92836b 100755 --- a/Ne10/CMSIS_NE10_fft.neonintrinsic_f16.h +++ b/Ne10/CMSIS_NE10_fft.neonintrinsic_f16.h @@ -119,14 +119,14 @@ #define CONST_TW_81 0.70710678f16 #define CONST_TW_81N -0.70710678f16 -const static float16x4_t Q_TW_81 = VDUPQ_N_F16(CONST_TW_81 ); -const static float16x4_t Q_TW_81N = VDUPQ_N_F16(CONST_TW_81N); +static const float16x4_t Q_TW_81 = VDUPQ_N_F16(CONST_TW_81 ); +static const float16x4_t Q_TW_81N = VDUPQ_N_F16(CONST_TW_81N); #define DIV_TW81 1.4142136f16 #define DIV_TW81N -1.4142136f16 -const static float16x4_t DIV_TW81_NEON = VDUPQ_N_F16(DIV_TW81); -const static float16x4_t DIV_TW81N_NEON = VDUPQ_N_F16(DIV_TW81N); +static const float16x4_t DIV_TW81_NEON = VDUPQ_N_F16(DIV_TW81); +static const float16x4_t DIV_TW81N_NEON = VDUPQ_N_F16(DIV_TW81N); #define NE10_RADIX8x4_R2C_NEON_KERNEL_S1(Q_OUT,Q_IN) do { \ Q_OUT ## 0 = vadd_f16 (Q_IN ## 0, Q_IN ## 4); \ diff --git a/Ne10/CMSIS_NE10_fft_common_variables.h b/Ne10/CMSIS_NE10_fft_common_variables.h index d105347d6..375d2777c 100755 --- a/Ne10/CMSIS_NE10_fft_common_variables.h +++ b/Ne10/CMSIS_NE10_fft_common_variables.h @@ -40,60 +40,60 @@ /////////////////////////// /* Twiddles used in Radix-8 FFT */ -const static ne10_float32_t TW_81_F32 = 0.70710678; // sqrt (2) / 2 -const static ne10_float32_t TW_81N_F32 = -0.70710678; // - TW_81_F32 +static const ne10_float32_t TW_81_F32 = 0.70710678f; // sqrt (2) / 2 +static const ne10_float32_t TW_81N_F32 = -0.70710678f; // - TW_81_F32 /* Twiddles used in Radix-5 FFT */ -const static ne10_fft_cpx_float32_t TW_5A_F32 = +static const ne10_fft_cpx_float32_t TW_5A_F32 = { - 0.309016994374947, // cos (2 * pi / 5) - -0.951056516295154 // - sin (2 * pi / 5) + 0.309016994374947f, // cos (2 * pi / 5) + -0.951056516295154f // - sin (2 * pi / 5) }; -const static ne10_fft_cpx_int32_t TW_5A_S32 = +static const ne10_fft_cpx_int32_t TW_5A_S32 = { 663608942, // round (TW_5A_F32.r * 2^31) -2042378317 // round (TW_5A_F32.i * 2^31) }; -const static ne10_fft_cpx_float32_t TW_5B_F32 = +static const ne10_fft_cpx_float32_t TW_5B_F32 = { - -0.809016994374947, // cos (4 * pi / 5) - -0.587785252292473 // - sin (4 * pi / 5) + -0.809016994374947f, // cos (4 * pi / 5) + -0.587785252292473f // - sin (4 * pi / 5) }; -const static ne10_fft_cpx_int32_t TW_5B_S32 = +static const ne10_fft_cpx_int32_t TW_5B_S32 = { -1737350766, // round (TW_5B_F32.r * 2^31) -1262259218 // round (TW_5B_F32.i * 2^31) }; /* Twiddles used in Radix-3 FFT */ -const static ne10_float32_t TW_3I_F32 = 0.866025403784439; // sqrt (3) / 2 -const static ne10_float32_t TW_3IN_F32 = - 0.866025403784439; // - TW_3IN_F32 -const static ne10_int32_t TW_3I_S32 = 1859775393; // round (TW_3I_F32 * 2^31) -const static ne10_int32_t TW_3IN_S32 = -1859775393; // round (TW_3IN_F32 * 2^31) +static const ne10_float32_t TW_3I_F32 = 0.866025403784439f; // sqrt (3) / 2 +static const ne10_float32_t TW_3IN_F32 = - 0.866025403784439f; // - TW_3IN_F32 +static const ne10_int32_t TW_3I_S32 = 1859775393; // round (TW_3I_F32 * 2^31) +static const ne10_int32_t TW_3IN_S32 = -1859775393; // round (TW_3IN_F32 * 2^31) #if defined(ARM_MATH_NEON_FLOAT16) && defined(ARM_FLOAT16_SUPPORTED) /* Twiddles used in Radix-8 FFT */ -const static ne10_float16_t TW_81_F16 = 0.70710678f16; // sqrt (2) / 2 -const static ne10_float16_t TW_81N_F16 = -0.70710678f16; // - TW_81_F32 +static const ne10_float16_t TW_81_F16 = 0.70710678f16; // sqrt (2) / 2 +static const ne10_float16_t TW_81N_F16 = -0.70710678f16; // - TW_81_F32 /* Twiddles used in Radix-5 FFT */ -const static ne10_fft_cpx_float16_t TW_5A_F16 = +static const ne10_fft_cpx_float16_t TW_5A_F16 = { 0.309016994374947f16, // cos (2 * pi / 5) -0.951056516295154f16 // - sin (2 * pi / 5) }; -const static ne10_fft_cpx_float16_t TW_5B_F16 = +static const ne10_fft_cpx_float16_t TW_5B_F16 = { -0.809016994374947f16, // cos (4 * pi / 5) -0.587785252292473f16 // - sin (4 * pi / 5) }; /* Twiddles used in Radix-3 FFT */ -const static ne10_float16_t TW_3I_F16 = 0.866025403784439f16; // sqrt (3) / 2 -const static ne10_float16_t TW_3IN_F16 = - 0.866025403784439f16; // - TW_3IN_F32 +static const ne10_float16_t TW_3I_F16 = 0.866025403784439f16; // sqrt (3) / 2 +static const ne10_float16_t TW_3IN_F16 = - 0.866025403784439f16; // - TW_3IN_F32 #endif #endif // NE10_FFT_COMMON_VARIBLES_H diff --git a/Ne10/CMSIS_NE10_fft_generic_float16.neonintrisic.c b/Ne10/CMSIS_NE10_fft_generic_float16.neonintrisic.c index 6824912de..c2f702f98 100755 --- a/Ne10/CMSIS_NE10_fft_generic_float16.neonintrisic.c +++ b/Ne10/CMSIS_NE10_fft_generic_float16.neonintrisic.c @@ -345,12 +345,12 @@ static inline void NE10_FFT8_FUC_NEON_F16 (CPLX out[8], const CPLX in[8]) { CPLX s[8]; - const static ne10_fft_cpx_float16_t TW_8[4] = + static const ne10_fft_cpx_float16_t TW_8[4] = { - { 1.00000, 0.00000 }, - { 0.70711, -0.70711 }, - { 0.00000, -1.00000 }, - { -0.70711, -0.70711 }, + { 1.00000f16, 0.00000f16 }, + { 0.70711f16, -0.70711f16 }, + { 0.00000f16, -1.00000f16 }, + { -0.70711f16, -0.70711f16 }, }; // STAGE - 1 @@ -430,7 +430,7 @@ static void ne10_radix_2_butterfly_float16_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25f16 / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ @@ -509,7 +509,7 @@ static void ne10_radix_4_butterfly_float16_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25f16 / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ @@ -593,7 +593,7 @@ static void ne10_radix_3_butterfly_float16_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25f16 / nfft); \ const float16x4_t TW_3IN_NEON_F16 = vdup_n_f16 (TW_3IN_F16); \ const float16x4_t HALF_NEON_F16 = vdup_n_f16 (0.5f16); \ \ @@ -693,7 +693,7 @@ static void ne10_radix_5_butterfly_float16_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25f16 / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ @@ -815,7 +815,7 @@ static void ne10_radix_8_butterfly_float16_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F16 (0.25f16 / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ diff --git a/Ne10/CMSIS_NE10_fft_generic_float32.neonintrisic.c b/Ne10/CMSIS_NE10_fft_generic_float32.neonintrisic.c index 165c5e7e6..d42680a24 100755 --- a/Ne10/CMSIS_NE10_fft_generic_float32.neonintrisic.c +++ b/Ne10/CMSIS_NE10_fft_generic_float32.neonintrisic.c @@ -429,12 +429,12 @@ static inline void NE10_FFT8_FUC_NEON_F32 (CPLX out[8], const CPLX in[8]) { CPLX s[8]; - const static ne10_fft_cpx_float32_t TW_8[4] = + static const ne10_fft_cpx_float32_t TW_8[4] = { - { 1.00000, 0.00000 }, - { 0.70711, -0.70711 }, - { 0.00000, -1.00000 }, - { -0.70711, -0.70711 }, + { 1.00000f, 0.00000f }, + { 0.70711f, -0.70711f }, + { 0.00000f, -1.00000f }, + { -0.70711f, -0.70711f }, }; // STAGE - 1 @@ -514,7 +514,7 @@ static void ne10_radix_2_butterfly_float32_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25f / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ @@ -593,7 +593,7 @@ static void ne10_radix_4_butterfly_float32_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25f / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ @@ -677,7 +677,7 @@ static void ne10_radix_3_butterfly_float32_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25f / nfft); \ const float32x4_t TW_3IN_NEON_F32 = vdupq_n_f32 (TW_3IN_F32); \ const float32x4_t HALF_NEON_F32 = vdupq_n_f32 (0.5f); \ \ @@ -777,7 +777,7 @@ static void ne10_radix_5_butterfly_float32_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25f / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ @@ -899,7 +899,7 @@ static void ne10_radix_8_butterfly_float32_neon_##ISFIRSTSTAGE##_##ISINVERSE##_# ne10_int32_t f_count; \ ne10_int32_t m_count; \ \ - const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25 / nfft); \ + const REAL one_by_fft_neon = NE10_REAL_DUP_NEON_F32 (0.25f / nfft); \ \ for (f_count = fstride; f_count > 0; f_count--) \ { \ diff --git a/Ne10/NE10_fft_float32.neonintrinsic.c b/Ne10/NE10_fft_float32.neonintrinsic.c index b22134d1c..776e75b69 100644 --- a/Ne10/NE10_fft_float32.neonintrinsic.c +++ b/Ne10/NE10_fft_float32.neonintrinsic.c @@ -422,8 +422,8 @@ __STATIC_INLINE void ne10_radix8x4_neon (ne10_fft_cpx_float32_t *out, ne10_int32_t src_step = stride << 1; // ne10_fft_cpx_float32_t -> float32_t offset const float32_t *p_src = (const float32_t *) in; float32_t *p_dst = (float32_t *) out; - const ne10_float32_t TW_81 = 0.70710678; - const ne10_float32_t TW_81N = -0.70710678; + const ne10_float32_t TW_81 = 0.70710678f; + const ne10_float32_t TW_81N = -0.70710678f; CMPLX_VEC_F32 q2_in0, q2_in1, q2_in2, q2_in3, q2_in4, q2_in5, q2_in6, q2_in7; float32x4_t q_sin0_r, q_sin0_i, q_sin1_r, q_sin1_i, q_sin2_r, q_sin2_i, q_sin3_r, q_sin3_i; @@ -759,8 +759,8 @@ __STATIC_INLINE void ne10_radix8x4_inverse_neon (ne10_fft_cpx_float32_t *out, ne10_int32_t src_step = stride << 1; const float32_t *p_src = (const float32_t *) in; float32_t *p_dst = (float32_t *) out; - const ne10_float32_t TW_81 = 0.70710678; - const ne10_float32_t TW_81N = -0.70710678; + const ne10_float32_t TW_81 = 0.70710678f; + const ne10_float32_t TW_81N = -0.70710678f; CMPLX_VEC_F32 q2_in0, q2_in1, q2_in2, q2_in3, q2_in4, q2_in5, q2_in6, q2_in7; float32x4_t q_sin0_r, q_sin0_i, q_sin1_r, q_sin1_i, q_sin2_r, q_sin2_i, q_sin3_r, q_sin3_i; diff --git a/Ne10/NE10_rfft_float16.neonintrinsic.c b/Ne10/NE10_rfft_float16.neonintrinsic.c index c74aa5656..8193d41a1 100755 --- a/Ne10/NE10_rfft_float16.neonintrinsic.c +++ b/Ne10/NE10_rfft_float16.neonintrinsic.c @@ -1119,7 +1119,7 @@ static void arm_ne10_radix4_c2r_with_twiddles_first_stage_second_butterfly ( NE10_INV_BUTTERFLY_TMP( 0,1, 1,3, 1,0, 3,2); - q_in3[3] *= - 1.0f; + q_in3[3] = (_Float16)q_in3[3] * (-(_Float16)1.0f16); NE10_INV_BUTTERFLY_TMP( 1,1, 0,3, 3,3, 1,1); @@ -1132,7 +1132,7 @@ static void arm_ne10_radix4_c2r_with_twiddles_first_stage_second_butterfly ( NE10_INV_BUTTERFLY_TMP( 2,1, 3,3, 1,2, 3,0); - q_in3[1] *= - 1.0f; + q_in3[1] = (_Float16)q_in3[1] * (-(_Float16)1.0f16); NE10_INV_BUTTERFLY_TMP( 3,1, 2,3, 3,1, 1,3); #undef NE10_INV_BUTTERFLY_TMP diff --git a/Ne10/NE10_rfft_float32.neonintrinsic.c b/Ne10/NE10_rfft_float32.neonintrinsic.c index 30e191ae0..af27353c2 100755 --- a/Ne10/NE10_rfft_float32.neonintrinsic.c +++ b/Ne10/NE10_rfft_float32.neonintrinsic.c @@ -109,7 +109,7 @@ static void arm_ne10_radix8x4_c2r_neon ( NE10_DECLARE_8(float32x4_t,q_out); #if defined(CMSIS_NE10_DSP_RIFFT_SCALING) - const ne10_float32_t one_by_N = 0.25 / nfft; + const ne10_float32_t one_by_N = 0.25f / nfft; const float32x4_t one_by_N_neon = vdupq_n_f32(one_by_N); #endif @@ -193,7 +193,7 @@ static void arm_ne10_radix4x4_c2r_neon ( float32x4_t *Fout_neon = (float32x4_t*) Fout; #if defined(CMSIS_NE10_DSP_RIFFT_SCALING) - const ne10_float32_t one_by_N = 0.25 / nfft; + const ne10_float32_t one_by_N = 0.25f / nfft; const float32x4_t one_by_N_neon = vdupq_n_f32(one_by_N); #endif for (f_count = 0; f_count < fstride; f_count ++) diff --git a/README.md b/README.md index 291d19aaa..0d4d0dbee 100755 --- a/README.md +++ b/README.md @@ -6,6 +6,8 @@ [![CPP Tests](https://github.com/ARM-software/CMSIS-DSP/actions/workflows/runcpptest.yaml/badge.svg)](https://github.com/ARM-software/CMSIS-DSP/actions/workflows/runcpptest.yaml) +[![Neon Tests](https://github.com/ARM-software/CMSIS-DSP/actions/workflows/runneontest.yaml/badge.svg)](https://github.com/ARM-software/CMSIS-DSP/actions/workflows/runneontest.yaml) + ## About CMSIS-DSP is an optimized compute library for embedded systems (DSP is in the name for legacy reasons). diff --git a/Source/DistanceFunctions/arm_canberra_distance_f16.c b/Source/DistanceFunctions/arm_canberra_distance_f16.c index 632ee1bfe..5478141bd 100755 --- a/Source/DistanceFunctions/arm_canberra_distance_f16.c +++ b/Source/DistanceFunctions/arm_canberra_distance_f16.c @@ -150,7 +150,7 @@ ARM_DSP_ATTRIBUTE float16_t arm_canberra_distance_f16(const float16_t *pA,const tmpA = *pA++; tmpB = *pB++; - diff = fabsf((float32_t)((_Float16)tmpA - (_Float16)tmpB)); + diff = (float16_t)fabsf((float32_t)((_Float16)tmpA - (_Float16)tmpB)); sum = (_Float16)fabsf((float32_t)tmpA) + (_Float16)fabsf((float32_t)tmpB); if (((_Float16)tmpA != 0.0f16) || ((_Float16)tmpB != 0.0f16)) { diff --git a/Source/DistanceFunctions/arm_dice_distance.c b/Source/DistanceFunctions/arm_dice_distance.c index e3ca16012..a4c058f87 100755 --- a/Source/DistanceFunctions/arm_dice_distance.c +++ b/Source/DistanceFunctions/arm_dice_distance.c @@ -79,7 +79,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_dice_distance(const uint32_t *pA, const uint32_t arm_boolean_distance_TT_TF_FT(pA, pB, numberOfBools, &ctt, &ctf, &cft); - return(1.0*(ctf + cft) / (2.0*ctt + cft + ctf)); + return(1.0f*(ctf + cft) / (2.0f*ctt + cft + ctf)); } diff --git a/Source/DistanceFunctions/arm_hamming_distance.c b/Source/DistanceFunctions/arm_hamming_distance.c index 4280fef0f..6c57b391e 100755 --- a/Source/DistanceFunctions/arm_hamming_distance.c +++ b/Source/DistanceFunctions/arm_hamming_distance.c @@ -61,7 +61,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_hamming_distance(const uint32_t *pA, const uint3 arm_boolean_distance_TF_FT(pA, pB, numberOfBools, &ctf, &cft); - return(1.0*(ctf + cft) / numberOfBools); + return(1.0f*(ctf + cft) / numberOfBools); } diff --git a/Source/DistanceFunctions/arm_jaccard_distance.c b/Source/DistanceFunctions/arm_jaccard_distance.c index fd6f7bbb0..656fd2496 100755 --- a/Source/DistanceFunctions/arm_jaccard_distance.c +++ b/Source/DistanceFunctions/arm_jaccard_distance.c @@ -63,7 +63,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_jaccard_distance(const uint32_t *pA, const uint3 arm_boolean_distance_TT_TF_FT(pA, pB, numberOfBools, &ctt, &ctf, &cft); - return(1.0*(ctf + cft) / (ctt + cft + ctf)); + return(1.0f*(ctf + cft) / (ctt + cft + ctf)); } diff --git a/Source/DistanceFunctions/arm_kulsinski_distance.c b/Source/DistanceFunctions/arm_kulsinski_distance.c index c88834e9a..265de0911 100755 --- a/Source/DistanceFunctions/arm_kulsinski_distance.c +++ b/Source/DistanceFunctions/arm_kulsinski_distance.c @@ -64,7 +64,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_kulsinski_distance(const uint32_t *pA, const uin arm_boolean_distance_TT_TF_FT(pA, pB, numberOfBools, &ctt, &ctf, &cft); - return(1.0*(ctf + cft - ctt + numberOfBools) / (cft + ctf + numberOfBools)); + return(1.0f*(ctf + cft - ctt + numberOfBools) / (cft + ctf + numberOfBools)); } diff --git a/Source/DistanceFunctions/arm_rogerstanimoto_distance.c b/Source/DistanceFunctions/arm_rogerstanimoto_distance.c index 3f30148e2..0b2fbacb5 100755 --- a/Source/DistanceFunctions/arm_rogerstanimoto_distance.c +++ b/Source/DistanceFunctions/arm_rogerstanimoto_distance.c @@ -66,7 +66,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_rogerstanimoto_distance(const uint32_t *pA, cons r = 2*(ctf + cft); - return(1.0*r / (r + ctt + cff)); + return(1.0f*r / (r + ctt + cff)); } diff --git a/Source/DistanceFunctions/arm_sokalmichener_distance.c b/Source/DistanceFunctions/arm_sokalmichener_distance.c index 4abd0291c..c87ac4f0a 100755 --- a/Source/DistanceFunctions/arm_sokalmichener_distance.c +++ b/Source/DistanceFunctions/arm_sokalmichener_distance.c @@ -64,8 +64,8 @@ ARM_DSP_ATTRIBUTE float32_t arm_sokalmichener_distance(const uint32_t *pA, const arm_boolean_distance_TT_FF_TF_FT(pA, pB, numberOfBools, &ctt, &cff, &ctf, &cft); - r = 2.0*(ctf + cft); - s = 1.0*(cff + ctt); + r = 2.0f*(ctf + cft); + s = 1.0f*(cff + ctt); return(r / (s+r)); } diff --git a/Source/DistanceFunctions/arm_sokalsneath_distance.c b/Source/DistanceFunctions/arm_sokalsneath_distance.c index 6a86c591c..fb8c0fbce 100755 --- a/Source/DistanceFunctions/arm_sokalsneath_distance.c +++ b/Source/DistanceFunctions/arm_sokalsneath_distance.c @@ -63,7 +63,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_sokalsneath_distance(const uint32_t *pA, const u arm_boolean_distance_TT_TF_FT(pA, pB, numberOfBools, &ctt, &ctf, &cft); - r = 2.0*(ctf + cft); + r = 2.0f*(ctf + cft); return(r / (r + ctt)); } diff --git a/Source/DistanceFunctions/arm_yule_distance.c b/Source/DistanceFunctions/arm_yule_distance.c index c4067035c..84e94582d 100755 --- a/Source/DistanceFunctions/arm_yule_distance.c +++ b/Source/DistanceFunctions/arm_yule_distance.c @@ -65,7 +65,7 @@ ARM_DSP_ATTRIBUTE float32_t arm_yule_distance(const uint32_t *pA, const uint32_t r = 2*(ctf * cft); - return(1.0*r / (r/2.0 + ctt * cff)); + return(1.0f*r / (r/2.0f + ctt * cff)); } diff --git a/Source/FastMathFunctions/arm_atan2_f16.c b/Source/FastMathFunctions/arm_atan2_f16.c index 4f0df68b1..6c5e93a07 100755 --- a/Source/FastMathFunctions/arm_atan2_f16.c +++ b/Source/FastMathFunctions/arm_atan2_f16.c @@ -67,7 +67,7 @@ __STATIC_FORCEINLINE float16_t arm_atan_limited_f16(float16_t x) __STATIC_FORCEINLINE float16_t arm_atan_f16(float16_t x) { int sign=0; - float16_t res=0.0f16; + _Float16 res=0.0f16; if ((_Float16)x < 0.0f16) { @@ -91,7 +91,7 @@ __STATIC_FORCEINLINE float16_t arm_atan_f16(float16_t x) res = -(_Float16)res; } - return(res); + return((float16_t)res); } /** diff --git a/Source/FastMathFunctions/arm_vlog_f16.c b/Source/FastMathFunctions/arm_vlog_f16.c index 56bcfcf25..fe8fd105e 100755 --- a/Source/FastMathFunctions/arm_vlog_f16.c +++ b/Source/FastMathFunctions/arm_vlog_f16.c @@ -61,15 +61,15 @@ coefs = Chop@Flatten[CoefficientList[lut, x]]; */ static float16_t lut_logf16[NB_LUT_LOGF16]={ - 0,0.125,-0.00781197,0.00063974,0.117783, - 0.111111,-0.00617212,0.000447935,0.223144, - 0.1,-0.00499952,0.000327193,0.318454,0.0909091, - -0.00413191,0.000246234,0.405465,0.0833333, - -0.00347199,0.000189928,0.485508,0.0769231, - -0.00295841,0.00014956,0.559616,0.0714286, - -0.0025509,0.000119868,0.628609,0.0666667, - -0.00222213,0.0000975436,0.693147, - 0.0625,-0.00195305,0.0000804357}; + 0,(float16_t)0.125,(float16_t)-0.00781197,(float16_t)0.00063974,(float16_t)0.117783,(float16_t) + 0.111111,(float16_t)-0.00617212,(float16_t)0.000447935,(float16_t)0.223144,(float16_t) + 0.1,(float16_t)-0.00499952,(float16_t)0.000327193,(float16_t)0.318454,(float16_t)0.0909091,(float16_t) + -0.00413191,(float16_t)0.000246234,(float16_t)0.405465,(float16_t)0.0833333,(float16_t) + -0.00347199,(float16_t)0.000189928,(float16_t)0.485508,(float16_t)0.0769231,(float16_t) + -0.00295841,(float16_t)0.00014956,(float16_t)0.559616,(float16_t)0.0714286,(float16_t) + -0.0025509,(float16_t)0.000119868,(float16_t)0.628609,(float16_t)0.0666667,(float16_t) + -0.00222213,(float16_t)0.0000975436,(float16_t)0.693147,(float16_t) + 0.0625,(float16_t)-0.00195305,(float16_t)0.0000804357}; static float16_t logf16_scalar(float16_t x) diff --git a/Source/FilteringFunctions/Config.cmake b/Source/FilteringFunctions/Config.cmake index fc175f247..bf4c62aac 100644 --- a/Source/FilteringFunctions/Config.cmake +++ b/Source/FilteringFunctions/Config.cmake @@ -50,10 +50,12 @@ target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_correlate_opt_q7.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_correlate_q15.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_correlate_q31.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_correlate_q7.c) +target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_f64.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_f32.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_f64.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_fast_q15.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_fast_q31.c) +target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_init_f64.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_init_f32.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_init_f64.c) target_sources(CMSISDSP PRIVATE FilteringFunctions/arm_fir_decimate_init_q15.c) diff --git a/Source/FilteringFunctions/arm_biquad_cascade_df2T_f32.c b/Source/FilteringFunctions/arm_biquad_cascade_df2T_f32.c index 87d06271b..08dd5a171 100644 --- a/Source/FilteringFunctions/arm_biquad_cascade_df2T_f32.c +++ b/Source/FilteringFunctions/arm_biquad_cascade_df2T_f32.c @@ -179,7 +179,9 @@ ARM_DSP_ATTRIBUTE void arm_biquad_cascade_df2T_f32( while (stage > 0U); } #else -#if defined(ARM_MATH_NEON) +/* The Neon version is not passing the test so is disabled +until the problem is corrected. Issue #186 */ +#if 0 //defined(ARM_MATH_NEON) ARM_DSP_ATTRIBUTE void arm_biquad_cascade_df2T_f32( const arm_biquad_cascade_df2T_instance_f32 * S, diff --git a/Source/MatrixFunctions/arm_mat_cholesky_f16.c b/Source/MatrixFunctions/arm_mat_cholesky_f16.c index dc2aa1748..6b31b8673 100755 --- a/Source/MatrixFunctions/arm_mat_cholesky_f16.c +++ b/Source/MatrixFunctions/arm_mat_cholesky_f16.c @@ -234,7 +234,7 @@ ARM_DSP_ATTRIBUTE arm_status arm_mat_cholesky_f16( /* The division is done in float32 for accuracy reason and because doing it in f16 would not have any impact on the performances. */ - invSqrtVj = 1.0f/sqrtf((float32_t)pG[i * n + i]); + invSqrtVj = (float16_t)(1.0f/sqrtf((float32_t)pG[i * n + i])); SCALE_COL_F16(pDst,i,invSqrtVj,i); } diff --git a/Source/MatrixFunctions/arm_mat_qr_f16.c b/Source/MatrixFunctions/arm_mat_qr_f16.c index eb68a76ea..4d8be11db 100644 --- a/Source/MatrixFunctions/arm_mat_qr_f16.c +++ b/Source/MatrixFunctions/arm_mat_qr_f16.c @@ -603,7 +603,7 @@ ARM_DSP_ATTRIBUTE arm_status arm_mat_qr_f16( k=1; while(blkCnt > 0) { - float16_t sum; + _Float16 sum; for(j=0;jnumCols-col; j++) { @@ -629,9 +629,12 @@ ARM_DSP_ATTRIBUTE arm_status arm_mat_qr_f16( pa = pa0; for(;knumRows-col; k++) { + _Float16 sum; for(j=0;jnumCols-col; j++) { - *pdst++ += (_Float16)*pv * (_Float16)*pa++; + sum = *pdst; + sum += (_Float16)*pv * (_Float16)*pa++; + *pdst++ = sum ; } pa += col; pv++; @@ -713,7 +716,7 @@ ARM_DSP_ATTRIBUTE arm_status arm_mat_qr_f16( k=1; while(blkCnt > 0) { - float16_t sum; + _Float16 sum; for(j=0;jnumRows-pos; j++) { @@ -739,9 +742,12 @@ ARM_DSP_ATTRIBUTE arm_status arm_mat_qr_f16( pa = pa0; for(;knumRows-pos; k++) { + _Float16 sum; for(j=0;jnumRows-pos; j++) { - *pdst++ += (_Float16)*pv * (_Float16)*pa++; + sum = *pdst; + sum += (_Float16)*pv * (_Float16)*pa++; + *pdst++ = sum ; } pa += pos; pv++; diff --git a/Source/MatrixFunctions/arm_mat_solve_lower_triangular_f16.c b/Source/MatrixFunctions/arm_mat_solve_lower_triangular_f16.c index 8dafc143c..ffddaa7a0 100755 --- a/Source/MatrixFunctions/arm_mat_solve_lower_triangular_f16.c +++ b/Source/MatrixFunctions/arm_mat_solve_lower_triangular_f16.c @@ -203,7 +203,7 @@ { lt_row = &pLT[n*i]; - float16_t tmp=a_col[i * cols]; + _Float16 tmp=a_col[i * cols]; for(k=0; k < i; k++) { diff --git a/Source/MatrixFunctions/arm_mat_solve_upper_triangular_f16.c b/Source/MatrixFunctions/arm_mat_solve_upper_triangular_f16.c index 332280f09..6feb00d3c 100755 --- a/Source/MatrixFunctions/arm_mat_solve_upper_triangular_f16.c +++ b/Source/MatrixFunctions/arm_mat_solve_upper_triangular_f16.c @@ -193,7 +193,7 @@ arm_status status; /* status of matrix inverse */ { ut_row = &pUT[n*i]; - float16_t tmp=a_col[i * cols]; + _Float16 tmp=a_col[i * cols]; for(k=n-1; k > i; k--) { diff --git a/Source/MatrixFunctions/arm_mat_vec_mult_f16.c b/Source/MatrixFunctions/arm_mat_vec_mult_f16.c index be446f1a4..d2569483e 100755 --- a/Source/MatrixFunctions/arm_mat_vec_mult_f16.c +++ b/Source/MatrixFunctions/arm_mat_vec_mult_f16.c @@ -311,10 +311,10 @@ ARM_DSP_ATTRIBUTE void arm_mat_vec_mult_f16(const arm_matrix_instance_f16 *pSrcM pInVec = pVec; /* Initialize accumulators */ - float16_t sum1 = 0.0f16; - float16_t sum2 = 0.0f16; - float16_t sum3 = 0.0f16; - float16_t sum4 = 0.0f16; + _Float16 sum1 = 0.0f16; + _Float16 sum2 = 0.0f16; + _Float16 sum3 = 0.0f16; + _Float16 sum4 = 0.0f16; /* Loop unrolling: process 2 columns per iteration */ colCnt = numCols; @@ -360,7 +360,7 @@ ARM_DSP_ATTRIBUTE void arm_mat_vec_mult_f16(const arm_matrix_instance_f16 *pSrcM row = numRows & 3u; while (row > 0) { - float16_t sum = 0.0f16; + _Float16 sum = 0.0f16; pInVec = pVec; pInA1 = pSrcA + i; diff --git a/Source/StatisticsFunctions/arm_absmax_f16.c b/Source/StatisticsFunctions/arm_absmax_f16.c index d5a9e8ddf..6237553d0 100755 --- a/Source/StatisticsFunctions/arm_absmax_f16.c +++ b/Source/StatisticsFunctions/arm_absmax_f16.c @@ -143,7 +143,7 @@ ARM_DSP_ATTRIBUTE void arm_absmax_f16( float16_t * pResult, uint32_t * pIndex) { - float16_t cur_absmax, out; /* Temporary variables to store the output value. */\ + _Float16 cur_absmax, out; /* Temporary variables to store the output value. */\ uint32_t blkCnt, outIndex; /* Loop counter */ \ uint32_t index; /* index of maximum value */ \ \ diff --git a/Source/StatisticsFunctions/arm_absmax_no_idx_f16.c b/Source/StatisticsFunctions/arm_absmax_no_idx_f16.c index 482ee6496..a7409abcb 100755 --- a/Source/StatisticsFunctions/arm_absmax_no_idx_f16.c +++ b/Source/StatisticsFunctions/arm_absmax_no_idx_f16.c @@ -111,7 +111,7 @@ ARM_DSP_ATTRIBUTE void arm_absmax_no_idx_f16( uint32_t blockSize, float16_t * pResult) { - float16_t cur_absmax, out; /* Temporary variables to store the output value. */\ + _Float16 cur_absmax, out; /* Temporary variables to store the output value. */\ uint32_t blkCnt; /* Loop counter */ \ \ \ diff --git a/Source/StatisticsFunctions/arm_absmin_f16.c b/Source/StatisticsFunctions/arm_absmin_f16.c index 10d6f2efc..72c53e96d 100755 --- a/Source/StatisticsFunctions/arm_absmin_f16.c +++ b/Source/StatisticsFunctions/arm_absmin_f16.c @@ -145,7 +145,7 @@ ARM_DSP_ATTRIBUTE void arm_absmin_f16( float16_t * pResult, uint32_t * pIndex) { - float16_t cur_absmin, out; /* Temporary variables to store the output value. */\ + _Float16 cur_absmin, out; /* Temporary variables to store the output value. */\ uint32_t blkCnt, outIndex; /* Loop counter */ \ uint32_t index; /* index of maximum value */ \ \ diff --git a/Source/StatisticsFunctions/arm_absmin_no_idx_f16.c b/Source/StatisticsFunctions/arm_absmin_no_idx_f16.c index 3f9bac14b..5e944dbb1 100755 --- a/Source/StatisticsFunctions/arm_absmin_no_idx_f16.c +++ b/Source/StatisticsFunctions/arm_absmin_no_idx_f16.c @@ -113,7 +113,7 @@ ARM_DSP_ATTRIBUTE void arm_absmin_no_idx_f16( uint32_t blockSize, float16_t * pResult) { - float16_t cur_absmin, out; /* Temporary variables to store the output value. */\ + _Float16 cur_absmin, out; /* Temporary variables to store the output value. */\ uint32_t blkCnt; /* Loop counter */ \ \ \ diff --git a/Source/StatisticsFunctions/arm_accumulate_f16.c b/Source/StatisticsFunctions/arm_accumulate_f16.c index d95a81541..007f68e50 100755 --- a/Source/StatisticsFunctions/arm_accumulate_f16.c +++ b/Source/StatisticsFunctions/arm_accumulate_f16.c @@ -66,7 +66,7 @@ ARM_DSP_ATTRIBUTE void arm_accumulate_f16( float16_t * pResult) { uint32_t blkCnt; /* Loop counter */ - float16_t sum = 0.0f16; /* Temporary result storage */ + _Float16 sum = 0.0f16; /* Temporary result storage */ #if defined (ARM_MATH_LOOPUNROLL) && !defined(ARM_MATH_AUTOVECTORIZE) diff --git a/Source/StatisticsFunctions/arm_mean_f16.c b/Source/StatisticsFunctions/arm_mean_f16.c index 32da38650..3c47ec63e 100755 --- a/Source/StatisticsFunctions/arm_mean_f16.c +++ b/Source/StatisticsFunctions/arm_mean_f16.c @@ -96,7 +96,7 @@ ARM_DSP_ATTRIBUTE void arm_mean_f16( float16_t * pResult) { uint32_t blkCnt; /* Loop counter */ - float16_t sum = 0.0f; /* Temporary result storage */ + _Float16 sum = 0.0f; /* Temporary result storage */ #if defined (ARM_MATH_LOOPUNROLL) && !defined(ARM_MATH_AUTOVECTORIZE) diff --git a/Source/SupportFunctions/arm_barycenter_f16.c b/Source/SupportFunctions/arm_barycenter_f16.c index b666cca1a..7d422de46 100755 --- a/Source/SupportFunctions/arm_barycenter_f16.c +++ b/Source/SupportFunctions/arm_barycenter_f16.c @@ -212,7 +212,7 @@ ARM_DSP_ATTRIBUTE void arm_barycenter_f16(const float16_t *in, const float16_t * const float16_t *pIn,*pW; float16_t *pOut; uint32_t blkCntVector,blkCntSample; - float16_t accum, w; + _Float16 accum, w; blkCntVector = nbVectors; blkCntSample = vecDim; diff --git a/Testing/CMakeLists.txt b/Testing/CMakeLists.txt index 1ffefbb96..4d9c0a8f4 100755 --- a/Testing/CMakeLists.txt +++ b/Testing/CMakeLists.txt @@ -14,9 +14,9 @@ option(NOAUTOVEC "Disable auto-vectorization" OFF) option(HOST "" ON) -option(NEON "" OFF) +option(NEON "" ON) option(NEONEXPERIMENTAL "" OFF) -option(DISABLEFLOAT16 "" ON) +option(DISABLEFLOAT16 "" OFF) add_subdirectory(../Source bin_dsp) @@ -157,47 +157,77 @@ target_include_directories(test PUBLIC FrameworkInclude target_compile_definitions(test PUBLIC EMBEDDED NOTIMING) -target_compile_options(test PUBLIC -Wsign-compare - -Wdouble-promotion - -DNDEBUG - -Wall - -Wextra - -O3 - -Wno-packed - -Wno-missing-variable-declarations - -Wno-missing-noreturn - -Wno-sign-conversion - -Wno-nonportable-include-path - -Wno-reserved-id-macro - -Wno-unused-macros - -Wno-documentation-unknown-command - -Wno-documentation - -Wno-parentheses-equality - -Wno-reserved-identifier +target_compile_options(test PUBLIC -Wsign-compare + -Wdouble-promotion + -DNDEBUG + -Wall + -Wextra + -O3 + -Wno-packed + -Wno-missing-noreturn + -Wno-sign-conversion + -Wno-unused-macros -ffunction-sections + -fdata-sections -march=armv8.2-a+fp16fml ) + +if (CMAKE_CXX_COMPILER_ID STREQUAL "GNU") + target_compile_options(CMSISDSP PRIVATE -Wsign-compare - -Wdouble-promotion - -DNDEBUG - -Wall - -Wextra - -O3 - -ffast-math - -Wno-packed - -Wno-missing-variable-declarations - -Wno-missing-noreturn - -Wno-sign-conversion - -Wno-nonportable-include-path - -Wno-reserved-id-macro - -Wno-unused-macros - -Wno-documentation-unknown-command - -Wno-documentation - -Wno-parentheses-equality - -Wno-reserved-identifier - -ffunction-sections - -march=armv8.2-a+fp16fml) + -Wdouble-promotion + -Wfloat-conversion + -DNDEBUG + -Wall + -Wextra + -std=c11 + -O3 + -ffast-math + -Wno-packed + -Wno-missing-prototypes + -Wno-missing-noreturn + -Wno-sign-conversion + -Wno-unused-macros + -flax-vector-conversions + -Wno-maybe-uninitialized + -ffunction-sections + -fdata-sections + -march=armv8.2-a+fp16fml + -Wmissing-prototypes + ) + +else() + +target_compile_option(CMSISDSP PRIVATE -Wsign-compare + -Wdouble-promotion + -Wfloat-conversion + -DNDEBUG + -Wall + -Wextra + -Werror + -std=c11 + -O3 + -ffast-math + -Wno-packed + -Wno-missing-variable-declarations + -Wno-missing-prototypes + -Wno-missing-noreturn + -Wno-sign-conversion + -Wno-nonportable-include-path + -Wno-reserved-id-macro + -Wno-unused-macros + -Wno-documentation-unknown-command + -Wno-documentation + -Wno-parentheses-equality + -Wno-reserved-identifier + -ffunction-sections + -fdata-sections + -march=armv8.2-a+fp16fml + -Wmissing-prototypes +) + +endif() target_link_libraries(test PUBLIC CMSISDSP) @@ -205,4 +235,4 @@ target_link_libraries(test PUBLIC CMSISDSP) if(NOAUTOVEC) target_compile_options(CMSISDSP PRIVATE -fno-slp-vectorize -fno-vectorize) target_compile_options(test PRIVATE -fno-slp-vectorize -fno-vectorize ) -endif() \ No newline at end of file +endif() diff --git a/Testing/FrameworkInclude/Error.h b/Testing/FrameworkInclude/Error.h index 62698bd60..641400706 100644 --- a/Testing/FrameworkInclude/Error.h +++ b/Testing/FrameworkInclude/Error.h @@ -169,6 +169,8 @@ namespace Client { using namespace std; + + template void assert_equal(unsigned long nb,T pa, T pb) { @@ -179,6 +181,13 @@ void assert_equal(unsigned long nb,T pa, T pb) }; +#if defined(ARM_FLOAT16_SUPPORTED) + +template<> +void assert_equal(unsigned long nb,float16_t pa, float16_t pb); + +#endif + template void assert_equal_partial(unsigned long nb,unsigned long nbSamples,AnyPattern &pa, AnyPattern &pb) { @@ -209,7 +218,7 @@ void assert_equal_partial(unsigned long nb,unsigned long nbSamples,AnyPattern } catch(Error &err) { - sprintf(id," (nb=%lu)",i); + snprintf(id,40," (nb=%lu)",i); strcat(err.details,id); throw(err); } @@ -241,7 +250,7 @@ void assert_equal(unsigned long nb,AnyPattern &pa, AnyPattern &pb) } catch(Error &err) { - sprintf(id," (nb=%lu)",i); + snprintf(id,40," (nb=%lu)",i); strcat(err.details,id); throw(err); } @@ -262,6 +271,12 @@ void assert_near_equal(unsigned long nb,T pa, T pb, T threshold) } }; +#if defined(ARM_FLOAT16_SUPPORTED) +template <> +void assert_near_equal(unsigned long nb,float16_t pa, float16_t pb, float16_t threshold); + +#endif + template <> void assert_near_equal(unsigned long nb,double pa, double pb, double threshold); template <> @@ -307,7 +322,7 @@ void assert_near_equal(unsigned long nb,AnyPattern &pa, AnyPattern &pb, T } catch(Error &err) { - sprintf(id," (nb=%lu)",i); + snprintf(id,40," (nb=%lu)",i); strcat(err.details,id); throw(err); } diff --git a/Testing/FrameworkInclude/FPGA.h b/Testing/FrameworkInclude/FPGA.h index 04628ba87..430c249d7 100644 --- a/Testing/FrameworkInclude/FPGA.h +++ b/Testing/FrameworkInclude/FPGA.h @@ -47,7 +47,7 @@ FPGA driver. Used to read a C array describing how to drive the test. class FPGA:public IO { public: - FPGA(const char *testDesc,const char *patterns); + FPGA(const unsigned char *testDesc,const char *patterns); ~FPGA(); virtual void ReadIdentification(); virtual void ReadTestIdentification(); @@ -110,7 +110,7 @@ FPGA driver. Used to read a C array describing how to drive the test. void readChar(char *); // Driver array - const char *m_testDesc; + const unsigned char *m_testDesc; // Pattern array const char *m_patterns; @@ -119,7 +119,7 @@ FPGA driver. Used to read a C array describing how to drive the test. //char *m_parameters; // Current position in the driver array - const char *currentDesc; + const unsigned char *currentDesc; int currentKind; Testing::testID_t currentId; // Current param ID for the node diff --git a/Testing/FrameworkInclude/Test.h b/Testing/FrameworkInclude/Test.h index e66e8c3c1..5e084dddc 100644 --- a/Testing/FrameworkInclude/Test.h +++ b/Testing/FrameworkInclude/Test.h @@ -42,11 +42,15 @@ // Pattern files are containing hexadecimal values. // So we need to be able to convert some int into float without convertion -#define TOINT16(v) *((uint16_t*)&v) -#define TOINT32(v) *((uint32_t*)&v) -#define TOINT64(v) *((uint64_t*)&v) +//#define TOINT16(v) *((uint16_t*)&v) +//#define TOINT32(v) *((uint32_t*)&v) +//#define TOINT64(v) *((uint64_t*)&v) + +#define TOINT16(d,v) memcpy(&d,&v,2) +#define TOINT32(d,v) memcpy(&d,&v,4) +#define TOINT64(d,v) memcpy(&d,&v,8) // Or convert some float into a uint32 or uint64 without convertion -#define TOTYP(TYP,v) *((TYP*)&v) +//#define TOTYP(TYP,v) *((TYP*)&v) // So it is a cast and not a data conversion. // (uint32_t)1.0 would give 1. We want the hexadecimal representation of the float. // TOINT32(1.0) can be used diff --git a/Testing/FrameworkInclude/Timing.h b/Testing/FrameworkInclude/Timing.h index f09e5c55c..37c1d4f2c 100644 --- a/Testing/FrameworkInclude/Timing.h +++ b/Testing/FrameworkInclude/Timing.h @@ -16,6 +16,7 @@ void cycleMeasurementStop(); Testing::cycles_t getCycles(); + #if defined(EXTBENCH) || defined(CACHEANALYSIS) extern unsigned long sectionCounter; diff --git a/Testing/FrameworkSource/FPGA.cpp b/Testing/FrameworkSource/FPGA.cpp index 466652d2a..a349824dc 100644 --- a/Testing/FrameworkSource/FPGA.cpp +++ b/Testing/FrameworkSource/FPGA.cpp @@ -54,7 +54,7 @@ namespace Client int dimensions; }; - FPGA::FPGA(const char *testDesc,const char *patterns) + FPGA::FPGA(const unsigned char *testDesc,const char *patterns) { this->m_testDesc=testDesc; this->m_patterns=patterns; @@ -736,7 +736,7 @@ namespace Client for(i=0; i < nb; i++) { v = data[i]; - t = TOINT64(v); + TOINT64(t,v); #if __SIZEOF_LONG__ == 8 printf("D: 0x%016lx\n",t); #else @@ -759,7 +759,7 @@ namespace Client for(i=0; i < nb; i++) { v = data[i]; - t = TOINT32(v); + TOINT32(t,v); printf("D: 0x%08x\n",t); } printf("D: END\n"); @@ -779,7 +779,7 @@ namespace Client for(i=0; i < nb; i++) { v = data[i]; - t = TOINT16(v); + TOINT16(t,v); printf("D: 0x0000%04x\n",t); } printf("D: END\n"); diff --git a/Testing/PatternGeneration/BIQUAD.py b/Testing/PatternGeneration/BIQUAD.py index 9848bd59e..fde4bb140 100755 --- a/Testing/PatternGeneration/BIQUAD.py +++ b/Testing/PatternGeneration/BIQUAD.py @@ -183,7 +183,12 @@ def generatePatterns(): configq15=Tools.Config(PATTERNDIR,PARAMDIR,"q15") #configq7=Tools.Config(PATTERNDIR,PARAMDIR,"q7") - + configf64.setOverwrite(False) + configf32.setOverwrite(False) + configf16.setOverwrite(False) + configq31.setOverwrite(False) + configq15.setOverwrite(False) + writeBenchmarks(configf32) writeBenchmarks(configf16) @@ -191,7 +196,9 @@ def generatePatterns(): writeBenchmarks(configq15) writeBenchmarks(configf64) + #configf32.setOverwrite(True) writeTests(configf32,0) + writeTests(configf16,16) writeTests(configq31,31) writeTests(configq15,15) diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadCoefs2_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadCoefs2_f32.txt index 5f31aa1d2..bf4536f76 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadCoefs2_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadCoefs2_f32.txt @@ -2,661 +2,661 @@ W 330 // 0.020000 0x3ca3d70a -// 0.012037 -0x3c4537e4 +// -0.031581 +0xbd015b61 // 0.020000 0x3ca3d70a -// 0.199104 -0x3e4be208 -// -0.012306 -0xbc499fe1 +// -0.531387 +0xbf080900 +// -0.158503 +0xbe224e9b // 1.000000 0x3f800000 -// 1.889097 -0x3ff1cdec +// -1.432153 +0xbfb750ce // 1.000000 0x3f800000 -// -0.949678 -0xbf731e19 -// -0.236693 -0xbe725f8a +// 0.528900 +0x3f076601 +// -0.259727 +0xbe84faf0 // 1.000000 0x3f800000 -// 1.037196 -0x3f84c2d6 +// 1.812335 +0x3fe7fa9a // 1.000000 0x3f800000 -// -0.495325 -0xbefd9b34 -// -0.313520 -0xbea085a6 +// -0.584219 +0xbf158f68 +// -0.402448 +0xbece0db7 // 0.020000 0x3ca3d70a -// -0.024479 -0xbcc888ab +// 0.038959 +0x3d1f93e6 // 0.020000 0x3ca3d70a -// -0.471932 -0xbef1a105 -// -0.082296 -0xbda88ab3 +// 0.128865 +0x3e03f511 +// -0.004751 +0xbb9babee // 1.000000 0x3f800000 -// -0.874890 -0xbf5ff8c6 +// 0.411919 +0x3ed2e703 // 1.000000 0x3f800000 -// -0.863779 -0xbf5d20a3 -// -0.208806 -0xbe55d122 +// 0.455310 +0x3ee91e56 +// -0.171682 +0xbe2fcd81 // 1.000000 0x3f800000 -// -0.827090 -0xbf53bc2c +// -1.057378 +0xbf87582c // 1.000000 0x3f800000 -// -1.384395 -0xbfb133d9 -// -0.481299 -0xbef66cd1 +// 0.866829 +0x3f5de87f +// -0.193644 +0xbe464aa2 // 0.020000 0x3ca3d70a -// 0.038033 -0x3d1bc833 +// 0.039928 +0x3d238bdb // 0.020000 0x3ca3d70a -// -0.032064 -0xbd0355e1 -// -0.000267 -0xb98bf1f3 +// -0.239197 +0xbe74f024 +// -0.016478 +0xbc86fd09 // 1.000000 0x3f800000 -// 1.474981 -0x3fbccc2c +// 1.801009 +0x3fe68778 // 1.000000 0x3f800000 -// 0.007100 -0x3be8a4a2 -// -0.001515 -0xbac68db9 +// 0.352178 +0x3eb4509f +// -0.033044 +0xbd075989 // 1.000000 0x3f800000 -// -1.887427 -0xbff19732 +// 0.808023 +0x3f4eda9f // 1.000000 0x3f800000 -// 0.899127 -0x3f662d36 -// -0.384210 -0xbec4b721 +// -0.653058 +0xbf272ec7 +// -0.302649 +0xbe9af4df // 0.020000 0x3ca3d70a -// -0.013804 -0xbc622b92 +// 0.038303 +0x3d1ce381 // 0.020000 0x3ca3d70a -// -0.117502 -0xbdf0a4fa -// -0.012055 -0xbc45833d +// -0.088482 +0xbdb53646 +// -0.002723 +0xbb326f0f // 1.000000 0x3f800000 -// 1.078180 -0x3f8a01cb +// 1.800439 +0x3fe674cc // 1.000000 0x3f800000 -// -0.129681 -0xbe04cb2b -// -0.033098 -0xbd079165 +// -0.068233 +0xbd8bbdca +// -0.028340 +0xbce82a14 // 1.000000 0x3f800000 -// 0.996541 -0x3f7f1d51 +// -0.494890 +0xbefd6245 // 1.000000 0x3f800000 -// -0.194323 -0xbe46fc7e -// -0.038220 -0xbd1c8ce6 +// 0.644288 +0x3f24f014 +// -0.135080 +0xbe0a5258 // 1.000000 0x3f800000 -// -0.687177 -0xbf2feada +// -0.899707 +0xbf66533b // 1.000000 0x3f800000 -// 0.063508 -0x3d82109a -// -0.042775 -0xbd2f34ea +// 0.759627 +0x3f4276f1 +// -0.147634 +0xbe172d7c // 1.000000 0x3f800000 -// 1.704006 -0x3fda1cdb +// -1.416380 +0xbfb54bee // 1.000000 0x3f800000 -// -0.548171 -0xbf0c54e7 -// -0.084293 -0xbdaca1a4 +// 0.916055 +0x3f6a8291 +// -0.219946 +0xbe613991 // 1.000000 0x3f800000 -// -0.628642 -0xbf20eeb1 +// 1.990599 +0x3ffecbef // 1.000000 0x3f800000 -// 0.199490 -0x3e4c4735 -// -0.156659 -0xbe206b56 +// -1.059943 +0xbf87ac3a +// -0.281632 +0xbe90320e // 1.000000 0x3f800000 -// -1.965964 -0xbffba4b8 +// -1.926106 +0xbff68aa7 // 1.000000 0x3f800000 -// 0.678742 -0x3f2dc202 -// -0.169337 -0xbe2d66a5 +// 1.103400 +0x3f8d3c3a +// -0.306292 +0xbe9cd25c // 1.000000 0x3f800000 -// 0.052987 -0x3d590906 +// 1.560152 +0x3fc7b313 // 1.000000 0x3f800000 -// -0.347633 -0xbeb1fce7 -// -0.485736 -0xbef8b263 +// -1.086739 +0xbf8b1a41 +// -0.421309 +0xbed7b5d8 // 0.020000 0x3ca3d70a -// 0.039890 -0x3d236345 +// 0.038738 +0x3d1eabf5 // 0.020000 0x3ca3d70a -// -0.059243 -0xbd72a875 -// -0.000878 -0xba66091c +// 0.086617 +0x3db16429 +// -0.004329 +0xbb8dd9f7 // 1.000000 0x3f800000 -// 1.979571 -0x3ffd6291 +// 1.815065 +0x3fe8540a // 1.000000 0x3f800000 -// -0.045561 -0xbd3a9e51 -// -0.009813 -0xbc20c6a3 +// 0.155334 +0x3e1f0fc1 +// -0.027329 +0xbcdfe078 // 1.000000 0x3f800000 -// -0.233140 -0xbe6ebc3f +// 0.159722 +0x3e238e48 // 1.000000 0x3f800000 -// 0.229830 -0x3e6b5871 -// -0.016231 -0xbc84f62a +// 0.015496 +0x3c7de2a2 +// -0.054544 +0xbd5f6996 // 1.000000 0x3f800000 -// -0.438341 -0xbee06e37 +// -1.224166 +0xbf9cb177 // 1.000000 0x3f800000 -// 0.204474 -0x3e516193 -// -0.021394 -0xbcaf42f2 +// 0.374463 +0x3ebfb9a7 +// -0.098741 +0xbdca38da // 1.000000 0x3f800000 -// 1.640090 -0x3fd1ee78 +// 1.807725 +0x3fe7638b // 1.000000 0x3f800000 -// -0.341116 -0xbeaea6cd -// -0.087470 -0xbdb3237b +// -0.556513 +0xbf0e779b +// -0.135965 +0xbe0b3a54 // 1.000000 0x3f800000 -// -0.776720 -0xbf46d727 +// -1.550145 +0xbfc66b23 // 1.000000 0x3f800000 -// 0.281065 -0x3e8fe7d1 -// -0.156631 -0xbe2063e0 +// 0.946455 +0x3f724ada +// -0.224304 +0xbe65afd9 // 1.000000 0x3f800000 -// -1.600251 -0xbfccd506 +// 0.691822 +0x3f311b41 // 1.000000 0x3f800000 -// 0.844595 -0x3f583767 -// -0.191939 -0xbe448ba6 +// -0.461062 +0xbeec1056 +// -0.332094 +0xbeaa0840 // 1.000000 0x3f800000 -// 0.040010 -0x3d23e128 +// -1.886400 +0xbff1758f // 1.000000 0x3f800000 -// -0.210694 -0xbe57c043 -// -0.376728 -0xbec0e285 +// 1.184259 +0x3f9795cd +// -0.393030 +0xbec93b31 // 0.020000 0x3ca3d70a -// 0.038789 -0x3d1ee0b2 +// -0.039488 +0xbd21beac // 0.020000 0x3ca3d70a -// 0.091082 -0x3dba8964 -// -0.002485 -0xbb22da4f +// -0.028692 +0xbceb0afb +// -0.000320 +0xb9a791d1 // 1.000000 0x3f800000 -// 1.898529 -0x3ff302fc +// -1.872281 +0xbfefa6ec // 1.000000 0x3f800000 -// 0.093405 -0x3dbf4b31 -// -0.005958 -0xbbc33824 +// 0.069167 +0x3d8da780 +// -0.006413 +0xbbd2252c // 1.000000 0x3f800000 -// 1.831999 -0x3fea7ef0 +// 1.985059 +0x3ffe166c // 1.000000 0x3f800000 -// -0.055416 -0xbd62fbcc -// -0.006199 -0xbbcb1d49 +// -0.334913 +0xbeab79c4 +// -0.053677 +0xbd5bdc55 // 1.000000 0x3f800000 -// 1.808033 -0x3fe76d9e +// 1.469019 +0x3fbc08d0 // 1.000000 0x3f800000 -// -0.027387 -0xbce05a56 -// -0.021675 -0xbcb1908b +// -0.254367 +0xbe823c69 +// -0.058502 +0xbd6fa00e // 1.000000 0x3f800000 -// 1.030738 -0x3f83ef38 +// -1.868942 +0xbfef397f // 1.000000 0x3f800000 -// 0.318118 -0x3ea2e05d -// -0.028561 -0xbce9f862 +// 0.187965 +0x3e4079e5 +// -0.087157 +0xbdb27f36 // 1.000000 0x3f800000 -// 1.855541 -0x3fed8262 +// -1.660115 +0xbfd47ea9 // 1.000000 0x3f800000 -// -0.612809 -0xbf1ce115 -// -0.109676 -0xbde09de6 +// 0.410856 +0x3ed25ba9 +// -0.184741 +0xbe3d2caa // 1.000000 0x3f800000 -// -1.547572 -0xbfc616d5 +// -0.087453 +0xbdb31aa2 // 1.000000 0x3f800000 -// 0.622561 -0x3f1f602c -// -0.126454 -0xbe017d15 +// 0.377120 +0x3ec115e2 +// -0.221524 +0xbe62d71b // 1.000000 0x3f800000 -// -0.045237 -0xbd394a0c +// -1.572203 +0xbfc93df1 // 1.000000 0x3f800000 -// 0.243642 -0x3e797d54 -// -0.322207 -0xbea4f84a +// 0.879188 +0x3f61127d +// -0.433036 +0xbeddb6d5 // 0.020000 0x3ca3d70a -// 0.038807 -0x3d1ef3ca +// 0.039726 +0x3d22b749 // 0.020000 0x3ca3d70a -// 0.083747 -0x3dab83b1 -// -0.003924 -0xbb80940d +// -0.067437 +0xbd8a1c3e +// -0.001169 +0xba993895 // 1.000000 0x3f800000 -// 1.781231 -0x3fe3ff5d +// 1.965514 +0x3ffb95f9 // 1.000000 0x3f800000 -// -0.188276 -0xbe40cb7e -// -0.012151 -0xbc4713ed +// -0.098647 +0xbdca0795 +// -0.005399 +0xbbb0eba8 // 1.000000 0x3f800000 -// 1.418355 -0x3fb58cab +// 1.959676 +0x3ffad6a7 // 1.000000 0x3f800000 -// 0.187357 -0x3e3fda77 -// -0.049920 -0xbd4c7967 +// 0.152078 +0x3e1bba3e +// -0.006162 +0xbbc9ebb5 // 1.000000 0x3f800000 -// 1.924918 -0x3ff663b4 +// 1.907803 +0x3ff432e0 // 1.000000 0x3f800000 -// -0.451611 -0xbee73997 -// -0.058635 -0xbd702bc4 +// -0.486125 +0xbef8e56e +// -0.063419 +0xbd81e1e2 // 1.000000 0x3f800000 -// 0.776756 -0x3f46d974 +// 0.191909 +0x3e4483ba // 1.000000 0x3f800000 -// 0.552291 -0x3f0d62f9 -// -0.077941 -0xbd9f9f9a +// 0.400997 +0x3ecd4f74 +// -0.094502 +0xbdc18a3a // 1.000000 0x3f800000 -// 1.184366 -0x3f97994d +// 0.753238 +0x3f40d435 // 1.000000 0x3f800000 -// -0.397430 -0xbecb7be9 -// -0.101465 -0xbdcfccc5 +// -0.373739 +0xbebf5aa8 +// -0.096328 +0xbdc5477f // 1.000000 0x3f800000 -// 1.995827 -0x3fff7741 +// -1.776952 +0xbfe37328 // 1.000000 0x3f800000 -// -0.645810 -0xbf2553d1 -// -0.104271 -0xbdd58c04 +// 0.646821 +0x3f259609 +// -0.104696 +0xbdd66ada // 1.000000 0x3f800000 -// -1.863420 -0xbfee8488 +// 1.887964 +0x3ff1a8cb // 1.000000 0x3f800000 -// 0.646199 -0x3f256d44 -// -0.113331 -0xbde819e8 +// -0.800252 +0xbf4cdd4e +// -0.200731 +0xbe4d8c62 // 1.000000 0x3f800000 -// -1.752569 -0xbfe05432 +// -1.887493 +0xbff1995c // 1.000000 0x3f800000 -// 0.631625 -0x3f21b227 -// -0.134006 -0xbe0938f1 +// 1.099672 +0x3f8cc20b +// -0.316940 +0xbea24606 // 1.000000 0x3f800000 -// -1.623323 -0xbfcfc90b +// -1.078741 +0xbf8a1432 // 1.000000 0x3f800000 -// 0.602597 -0x3f1a43cf -// -0.162854 -0xbe26c338 +// 0.661788 +0x3f296aed +// -0.346694 +0xbeb181e0 // 1.000000 0x3f800000 -// -1.977609 -0xbffd2247 +// -0.903780 +0xbf675e20 // 1.000000 0x3f800000 -// 0.983587 -0x3f7bcc55 -// -0.251309 -0xbe80ab96 +// 0.245661 +0x3e7b8e7c +// -0.351599 +0xbeb404bb // 0.020000 0x3ca3d70a -// -0.017903 -0xbc92a917 +// 0.039548 +0x3d21fd7b // 0.020000 0x3ca3d70a -// -0.034908 -0xbd0efc03 -// -0.003146 -0xbb4e25cb +// -0.028886 +0xbceca154 +// -0.000590 +0xba1aac41 // 1.000000 0x3f800000 -// 0.361548 -0x3eb91cd3 +// 1.966938 +0x3ffbc49d // 1.000000 0x3f800000 -// -0.090211 -0xbdb8c052 -// -0.004580 -0xbb9614fd +// -0.131080 +0xbe0639bc +// -0.005368 +0xbbafe4ab // 1.000000 0x3f800000 -// 0.767944 -0x3f4497fc +// -0.027922 +0xbce4bba9 // 1.000000 0x3f800000 -// -0.079952 -0xbda3be0c -// -0.012337 -0xbc4a203f +// 0.223636 +0x3e6500dd +// -0.019312 +0xbc9e34c9 // 1.000000 0x3f800000 -// 0.936274 -0x3f6fafa5 +// 1.819395 +0x3fe8e1f3 // 1.000000 0x3f800000 -// -0.178513 -0xbe36cc00 -// -0.034154 -0xbd0be585 +// -0.282467 +0xbe909f8c +// -0.023534 +0xbcc0c9d8 // 1.000000 0x3f800000 -// 0.231904 -0x3e6d7857 +// 1.749549 +0x3fdff138 // 1.000000 0x3f800000 -// -0.025949 -0xbcd49373 -// -0.059723 -0xbd74a00a +// -0.228462 +0xbe69f1de +// -0.030071 +0xbcf65671 // 1.000000 0x3f800000 -// -1.042340 -0xbf856b67 +// -0.883253 +0xbf621ce2 // 1.000000 0x3f800000 -// 0.728804 -0x3f3a92ed -// -0.133781 -0xbe08fde1 +// 0.175262 +0x3e3377ca +// -0.067231 +0xbd89b078 // 1.000000 0x3f800000 -// 0.957638 -0x3f7527c5 +// -1.996597 +0xbfff907c // 1.000000 0x3f800000 -// -0.681966 -0xbf2e9558 -// -0.178044 -0xbe365144 +// 0.535847 +0x3f092d44 +// -0.072625 +0xbd94bc72 // 1.000000 0x3f800000 -// -1.374160 -0xbfafe47a +// -1.941479 +0xbff88264 // 1.000000 0x3f800000 -// 0.984319 -0x3f7bfc50 -// -0.295302 -0xbe9731c6 +// 0.758777 +0x3f423f33 +// -0.163720 +0xbe27a630 // 1.000000 0x3f800000 -// -1.502140 -0xbfc0461f +// -1.935602 +0xbff7c1cf // 1.000000 0x3f800000 -// 1.079661 -0x3f8a3254 -// -0.320158 -0xbea3ebb3 +// 0.774382 +0x3f463de2 +// -0.168712 +0xbe2cc2ca // 1.000000 0x3f800000 -// -0.176259 -0xbe347d51 +// 1.233421 +0x3f9de0bb // 1.000000 0x3f800000 -// 0.075974 -0x3d9b9805 -// -0.336093 -0xbeac1463 +// -0.549261 +0xbf0c9c5c +// -0.270842 +0xbe8aabd4 // 1.000000 0x3f800000 -// -1.997183 -0xbfffa3b5 +// 1.876669 +0x3ff036b4 // 1.000000 0x3f800000 -// 1.260405 -0x3fa154f6 -// -0.406372 -0xbed00ffb +// -1.171951 +0xbf96027a +// -0.375677 +0xbec058ca // 0.020000 0x3ca3d70a -// 0.002067 -0x3b077d7d +// -0.022851 +0xbcbb32a6 // 0.020000 0x3ca3d70a -// -0.054644 -0xbd5fd22f -// -0.001188 -0xba9bb410 +// -0.004679 +0xbb994f6f +// -0.000035 +0xb810b8d2 // 1.000000 0x3f800000 -// 0.063542 -0x3d82227c +// -1.052142 +0xbf86ac99 // 1.000000 0x3f800000 -// 0.038380 -0x3d1d349f -// -0.002330 -0xbb18b85a +// -0.285572 +0xbe923670 +// -0.023704 +0xbcc22e6c // 1.000000 0x3f800000 -// -1.308848 -0xbfa78858 +// -1.836362 +0xbfeb0dec // 1.000000 0x3f800000 -// 0.201415 -0x3e4e3fb8 -// -0.010154 -0xbc265e7a +// 0.258988 +0x3e849a17 +// -0.024142 +0xbcc5c547 // 1.000000 0x3f800000 -// 0.324443 -0x3ea61d65 +// -0.577506 +0xbf13d769 // 1.000000 0x3f800000 -// -0.202344 -0xbe4f335c -// -0.035189 -0xbd1022a9 +// 0.011071 +0x3c3563e6 +// -0.039124 +0xbd204021 // 1.000000 0x3f800000 -// 0.183186 -0x3e3b9525 +// -0.278633 +0xbe8ea909 // 1.000000 0x3f800000 -// -0.037334 -0xbd18ebdd -// -0.035224 -0xbd104721 +// -0.403757 +0xbeceb93b +// -0.048708 +0xbd4781b2 // 1.000000 0x3f800000 -// 0.371348 -0x3ebe215e +// -0.256368 +0xbe8342aa // 1.000000 0x3f800000 -// -0.415932 -0xbed4f50b -// -0.045002 -0xbd385402 +// -0.446170 +0xbee47056 +// -0.051266 +0xbd51fc41 // 1.000000 0x3f800000 -// 0.620615 -0x3f1ee0a2 +// -1.752522 +0xbfe052a0 // 1.000000 0x3f800000 -// -0.438865 -0xbee0b2f1 -// -0.049304 -0xbd49f354 +// 0.661849 +0x3f296eed +// -0.170033 +0xbe2e1d1d // 1.000000 0x3f800000 -// 1.855075 -0x3fed7316 +// 0.311358 +0x3e9f6a45 // 1.000000 0x3f800000 -// -0.520948 -0xbf055cd5 -// -0.084570 -0xbdad3318 +// -0.366131 +0xbebb757e +// -0.176086 +0xbe344fe9 // 1.000000 0x3f800000 -// -0.082484 -0xbda8ed71 +// 1.127194 +0x3f9047e3 // 1.000000 0x3f800000 -// 0.039669 -0x3d227c25 -// -0.104842 -0xbdd6b75f +// -0.882441 +0xbf61e7a6 +// -0.234757 +0xbe70643d // 1.000000 0x3f800000 -// 0.710359 -0x3f35da0f +// 0.659264 +0x3f28c586 // 1.000000 0x3f800000 -// -0.353830 -0xbeb5293e -// -0.245166 -0xbe7b0caf +// -0.281161 +0xbe8ff460 +// -0.246255 +0xbe7c2a4b // 1.000000 0x3f800000 -// 1.961346 -0x3ffb0d63 +// 1.999415 +0x3fffecd2 // 1.000000 0x3f800000 -// -1.326857 -0xbfa9d672 -// -0.468162 -0xbeefb2fb +// -0.916118 +0xbf6a86b1 +// -0.262476 +0xbe866342 diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadInputs2_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadInputs2_f32.txt index ac94a21d3..feeb6a4ad 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadInputs2_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadInputs2_f32.txt @@ -1,134 +1,134 @@ W 66 +// 0.088448 +0x3db52433 // 1.000000 0x3f800000 -// 0.512719 -0x3f034193 -// -0.657915 -0xbf286d19 -// -0.447759 -0xbee540a5 -// 0.162976 -0x3e26e33b -// -0.626536 -0xbf2064a6 -// 0.941290 -0x3f70f85c -// -0.271793 -0xbe8b287e -// -1.000000 -0xbf800000 -// 0.239723 -0x3e7579ed -// -0.367794 -0xbebc4f72 -// -0.669104 -0xbf2b4a68 -// -0.563614 -0xbf104907 -// 0.019646 -0x3ca0f100 -// -0.741586 -0xbf3dd896 -// -0.686987 -0xbf2fde5c -// 0.632335 -0x3f21e0b3 -// 0.623159 -0x3f1f8754 +// -0.372630 +0xbebec96a +// 0.236714 +0x3e72652b +// 0.040559 +0x3d2620eb +// 0.497331 +0x3efea238 // 1.000000 0x3f800000 -// -0.134520 -0xbe09bfba -// -0.047935 -0xbd4457e9 -// 0.883679 -0x3f6238c4 -// -0.750073 -0xbf4004c9 -// -1.000000 -0xbf800000 -// 0.956342 -0x3f74d2d6 +// -0.185166 +0xbe3d9c1a +// 0.180820 +0x3e3928e0 +// 0.035388 +0x3d10f31f +// 0.575066 +0x3f133785 +// 0.517456 +0x3f047807 +// 0.172057 +0x3e302fb2 +// -0.438195 +0xbee05b21 // 1.000000 0x3f800000 -// 0.286657 -0x3e92c4b5 -// 0.276657 -0x3e8da5fa -// -0.041531 -0xbd2a1c65 -// -0.086568 -0xbdb14ac5 -// -0.272279 -0xbe8b6825 -// -0.075193 -0xbd99fec1 -// -0.135883 -0xbe0b24db -// 0.128069 -0x3e03246e -// -0.395272 -0xbeca6126 -// -0.493562 -0xbefcb439 -// 0.241812 -0x3e779dad -// -0.003724 -0xbb74140c -// -0.436178 -0xbedf52bc +// 0.565706 +0x3f10d21b +// -0.464682 +0xbeedeac1 +// 0.511738 +0x3f030145 +// 0.181040 +0x3e396290 +// 0.573825 +0x3f12e631 +// 0.505163 +0x3f015256 +// 0.314493 +0x3ea10549 // 1.000000 0x3f800000 -// -0.316548 -0xbea21297 -// -0.356192 -0xbeb65edc -// -0.537246 -0xbf0988f0 -// 0.401044 -0x3ecd5598 -// 0.135919 -0x3e0b2e78 -// -0.343346 -0xbeafcb0f +// 0.511088 +0x3f02d6aa +// -0.801524 +0xbf4d30b3 +// 0.026629 +0x3cda2572 +// -0.628458 +0xbf20e299 +// 0.411890 +0x3ed2e33b +// 0.523545 +0x3f06070e +// -0.174923 +0xbe331f19 +// -0.079613 +0xbda30c06 // -1.000000 0xbf800000 -// -0.055716 -0xbd643694 -// -0.149905 -0xbe1980a7 -// 0.440345 -0x3ee174e4 -// 0.255234 -0x3e82ae0e -// 0.242254 -0x3e78118b -// -0.352286 -0xbeb45ecd -// 0.922015 -0x3f6c0927 +// 0.058599 +0x3d70053f +// 0.120343 +0x3df67667 +// -0.040746 +0xbd26e4c3 +// 0.248106 +0x3e7e0f9d // -1.000000 0xbf800000 -// -0.212721 -0xbe59d39d -// -0.464466 -0xbeedce8c -// -0.719272 -0xbf382234 -// 0.456527 -0x3ee9bde9 +// 0.367631 +0x3ebc3a13 +// 0.325216 +0x3ea682be +// -0.120742 +0xbdf74761 +// 0.612524 +0x3f1cce5e +// -0.395595 +0xbeca8b76 +// -0.573885 +0xbf12ea20 +// -0.409574 +0xbed1b3b1 +// 0.706652 +0x3f34e720 +// -0.280305 +0xbe8f842a // -1.000000 0xbf800000 -// 0.117568 -0x3df0c786 -// 0.524351 -0x3f063be1 -// -0.368739 -0xbebccb5b -// -0.330865 -0xbea9671c -// -0.137054 -0xbe0c57d3 -// 0.084210 -0x3dac7612 +// -0.100229 +0xbdcd44bc +// 0.461258 +0x3eec29f6 +// 0.578507 +0x3f141901 +// 1.000000 +0x3f800000 +// 0.097858 +0x3dc86998 +// 0.324241 +0x3ea602fb +// -0.733889 +0xbf3be02e +// 0.771988 +0x3f45a107 +// -0.443468 +0xbee30e39 +// 1.000000 +0x3f800000 +// -0.075500 +0xbd9a9f89 +// -0.481116 +0xbef654d1 +// -0.400417 +0xbecd0378 +// 0.126203 +0x3e013b5d +// 0.633901 +0x3f224754 +// -0.043814 +0xbd337694 +// -0.516305 +0xbf042c96 +// 0.031491 +0x3d00fc6e +// 0.103479 +0x3dd3ece1 diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadRefs2_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadRefs2_f32.txt index 4338027d6..d1817de66 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadRefs2_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadRefs2_f32.txt @@ -1,134 +1,134 @@ W 66 +// 0.001769 +0x3ae7dc6a +// 0.016841 +0x3c89f6e8 +// -0.042615 +0xbd2e8ce7 +// 0.004734 +0x3b9b2207 +// 0.013847 +0x3c62dedf +// 0.032856 +0x3d069471 +// 0.078673 +0x3da11f78 +// 0.130797 +0x3e05efb2 +// 0.176154 +0x3e3461cb +// 0.212493 +0x3e5997bd +// 0.233657 +0x3e6f43c1 +// 0.010349 +0x3c298f65 +// 0.045514 +0x3d3a6d14 +// 0.080507 +0x3da4e102 +// 0.086535 +0x3db13981 +// 0.100651 +0x3dce224b +// 0.144454 +0x3e13ebc1 +// 0.168426 +0x3e2c77ce +// 0.141546 +0x3e10f156 +// 0.106673 +0x3dda7722 +// 0.129507 +0x3e049d74 +// 0.193405 +0x3e460bde // 0.020000 0x3ca3d70a -// 0.055900 -0x3d64f6e7 -// 0.072883 -0x3d9543cc -// -0.008955 -0xbc12b8bc -// 0.053821 -0x3d5c7346 -// -0.193340 -0xbe45faed -// 0.513563 -0x3f0378e3 -// -1.109050 -0xbf8df559 -// 2.009222 -0x40009718 -// -3.098030 -0xc0464621 -// 4.080722 -0x40829547 -// -0.013382 -0xbc5b4085 -// -0.042899 -0xbd2fb6ba -// -0.041428 -0xbd29b07c -// 0.002628 -0x3b2c3898 -// 0.015366 -0x3c7bc19a -// -0.000976 -0xba7fed63 -// 0.036623 -0x3d160196 -// 0.093172 -0x3dbed0f0 -// 0.044981 -0x3d383dcf -// -0.082501 -0xbda8f659 -// -0.119776 -0xbdf54d25 -// -0.015001 -0xbc75c8af -// -0.011961 -0xbc43f9a7 -// -0.007406 -0xbbf2b03c -// 0.020000 -0x3ca3d70a -// 0.075914 -0x3d9b78d8 -// 0.162109 -0x3e25fff0 -// 0.301184 -0x3e9a34d1 -// 0.474970 -0x3ef32f44 -// 0.621514 -0x3f1f1b8a -// 0.746168 -0x3f3f04e3 -// 0.832243 -0x3f550dde -// 0.002561 -0x3b27dcb6 -// 0.016286 -0x3c8569dd -// 0.023050 -0x3cbcd362 -// -0.120717 -0xbdf73a80 -// -0.705511 -0xbf349c5a -// -1.904387 -0xbff3c2f2 -// -3.425609 -0xc05b3d2e -// -4.592662 -0xc092f716 -// -4.868969 -0xc09bce97 -// -4.313825 -0xc08a0adb -// -3.625409 -0xc06806b5 -// 0.002718 -0x3b322700 -// 0.008925 -0x3c12386f -// -0.025665 -0xbcd23f35 -// -0.001114 -0xba920e74 -// -0.002224 -0xbb11c874 -// 0.004722 -0x3b9ab905 -// -0.012871 -0xbc52df41 -// 0.045150 -0x3d38eee2 -// -0.053628 -0xbd5ba88b -// 0.170905 -0x3e2f01be -// -0.180991 -0xbe3955ce -// -0.004254 -0xbb8b68b7 -// -0.016652 -0xbc886a6a -// -0.062913 -0xbd80d8c2 -// -0.132137 -0xbe074ee7 -// -0.316513 -0xbea20e09 -// -0.465959 -0xbeee9221 -// -0.846801 -0xbf58c7f2 -// -0.993027 -0xbf7e3707 -// -1.428914 -0xbfb6e6a5 -// -1.477528 -0xbfbd1fa2 -// -1.685673 -0xbfd7c425 +// 0.083206 +0x3daa680a +// 0.136475 +0x3e0bbffd +// 0.000533 +0x3a0b9d16 +// -0.010707 +0xbc2f6e59 +// -0.032931 +0xbd06e2d4 +// -0.023462 +0xbcc03408 +// 0.017265 +0x3c8d6e8f +// 0.027164 +0x3cde8711 +// -0.020278 +0xbca61de9 +// -0.091577 +0xbdbb8c98 +// 0.002407 +0x3b1dbc6b +// -0.011104 +0xbc35eeb9 +// 0.021992 +0x3cb4285d +// -0.042897 +0xbd2fb4e7 +// 0.098282 +0x3dc947e1 +// -0.112608 +0xbde69ee7 +// -0.050841 +0xbd503e68 +// 0.256241 +0x3e8331fc +// -0.206155 +0xbe531a6a +// -0.028113 +0xbce64c47 +// 0.161414 +0x3e2549ba +// 0.014133 +0x3c678e3d +// 0.084651 +0x3dad5d5c +// 0.190052 +0x3e429cfa +// -0.002005 +0xbb035f31 +// 0.001379 +0x3ab4b131 +// 0.040846 +0x3d274e86 +// 0.109656 +0x3de0934c +// 0.089274 +0x3db6d568 +// -0.114022 +0xbde98473 +// -0.350637 +0xbeb386ad +// -0.334898 +0xbeab77b2 +// -0.008869 +0xbc1150c8 +// 0.068364 +0x3d8c02af +// -0.273895 +0xbe8c3c03 +// 0.766872 +0x3f4451b6 +// -1.667028 +0xbfd5612b +// 2.959857 +0x403d6e4b +// -4.393206 +0xc08c9525 +// 5.463283 +0x40aed336 +// -5.541438 +0xc0b15376 +// 4.127624 +0x40841580 +// -1.129602 +0xbf9096d0 diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoInputs2_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoInputs2_f32.txt index 858737463..e50959cfb 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoInputs2_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoInputs2_f32.txt @@ -1,266 +1,266 @@ W 132 +// 0.088448 +0x3db52433 +// 0.163785 +0x3e27b73c // 1.000000 0x3f800000 -// 0.561685 -0x3f0fca96 -// 0.512719 -0x3f034193 -// 0.272361 -0x3e8b72e4 -// -0.657915 -0xbf286d19 -// -1.000000 -0xbf800000 -// -0.447759 -0xbee540a5 -// -0.020237 -0xbca5c85b -// 0.162976 -0x3e26e33b -// -0.538756 -0xbf09ebf0 -// -0.626536 -0xbf2064a6 -// -0.213121 -0xbe5a3c55 -// 0.941290 -0x3f70f85c -// -0.471829 -0xbef1939c -// -0.271793 -0xbe8b287e -// -0.375274 -0xbec023d9 -// -1.000000 -0xbf800000 -// -0.068524 -0xbd8c5657 -// 0.239723 -0x3e7579ed -// -1.000000 -0xbf800000 -// -0.367794 -0xbebc4f72 -// -0.280300 -0xbe8f8384 -// -0.669104 -0xbf2b4a68 -// -0.402517 -0xbece16c6 -// -0.563614 -0xbf104907 -// -0.314083 -0xbea0cf77 -// 0.019646 -0x3ca0f100 -// 0.710846 -0x3f35f9fe -// -0.741586 -0xbf3dd896 +// 0.757137 +0x3f41d3c3 +// -0.372630 +0xbebec96a // 1.000000 0x3f800000 -// -0.686987 -0xbf2fde5c -// -0.298660 -0xbe98e9f8 -// 0.632335 -0x3f21e0b3 -// -0.750783 -0xbf403348 -// 0.623159 -0x3f1f8754 -// -0.082167 -0xbda8470e +// 0.236714 +0x3e72652b +// 0.088115 +0x3db4759a +// 0.040559 +0x3d2620eb +// -0.611261 +0xbf1c7ba0 +// 0.497331 +0x3efea238 +// -0.819514 +0xbf51cbaf // 1.000000 0x3f800000 -// -0.495482 -0xbefdafc7 -// -0.134520 -0xbe09bfba -// -0.400830 -0xbecd3997 -// -0.047935 -0xbd4457e9 -// 0.428835 -0x3edb9052 -// 0.883679 -0x3f6238c4 -// 0.254721 -0x3e826ac4 -// -0.750073 -0xbf4004c9 -// -1.000000 -0xbf800000 -// -1.000000 -0xbf800000 -// 0.153887 -0x3e1d94a4 -// 0.956342 -0x3f74d2d6 -// 0.133443 -0x3e08a537 +// 0.187791 +0x3e404c4b +// -0.185166 +0xbe3d9c1a +// -0.309109 +0xbe9e438f +// 0.180820 +0x3e3928e0 +// 0.606749 +0x3f1b53e8 +// 0.035388 +0x3d10f31f +// 1.000000 +0x3f800000 +// 0.575066 +0x3f133785 +// -0.147401 +0xbe16f046 +// 0.517456 +0x3f047807 +// -0.131620 +0xbe06c771 +// 0.172057 +0x3e302fb2 +// 0.622009 +0x3f1f3bf9 +// -0.438195 +0xbee05b21 // 1.000000 0x3f800000 -// -1.000000 -0xbf800000 -// 0.286657 -0x3e92c4b5 -// 0.740608 -0x3f3d9883 -// 0.276657 -0x3e8da5fa -// -0.135261 -0xbe0a81cb -// -0.041531 -0xbd2a1c65 -// 0.900548 -0x3f668a53 -// -0.086568 -0xbdb14ac5 -// 0.555311 -0x3f0e28e4 -// -0.272279 -0xbe8b6825 -// 0.776666 -0x3f46d398 -// -0.075193 -0xbd99fec1 -// 0.983008 -0x3f7ba66b -// -0.135883 -0xbe0b24db -// 0.932658 -0x3f6ec2a8 -// 0.128069 -0x3e03246e -// -0.092637 -0xbdbdb8aa -// -0.395272 -0xbeca6126 -// -0.483020 -0xbef74e68 -// -0.493562 -0xbefcb439 -// -0.737194 -0xbf3cb8bb -// 0.241812 -0x3e779dad -// -0.374436 -0xbebfb60b -// -0.003724 -0xbb74140c -// 0.075550 -0x3d9ab9ce -// -0.436178 -0xbedf52bc -// 0.006722 -0x3bdc4632 // 1.000000 0x3f800000 -// -0.652489 -0xbf270982 -// -0.316548 -0xbea21297 -// -0.482437 -0xbef701ef -// -0.356192 -0xbeb65edc +// 0.309511 +0x3e9e782d +// 0.565706 +0x3f10d21b +// -0.085347 +0xbdaeca89 +// -0.464682 +0xbeedeac1 +// -0.263483 +0xbe86e74d +// 0.511738 +0x3f030145 +// -0.067385 +0xbd8a0125 +// 0.181040 +0x3e396290 +// 0.057877 +0x3d6d10db +// 0.573825 +0x3f12e631 +// -0.638500 +0xbf2374c0 +// 0.505163 +0x3f015256 +// -0.472829 +0xbef21696 +// 0.314493 +0x3ea10549 +// 0.071930 +0x3d93502a +// 1.000000 +0x3f800000 +// -0.525465 +0xbf0684e7 +// 0.511088 +0x3f02d6aa +// 0.343492 +0x3eafde25 +// -0.801524 +0xbf4d30b3 +// 1.000000 +0x3f800000 +// 0.026629 +0x3cda2572 +// 0.668761 +0x3f2b33e4 +// -0.628458 +0xbf20e299 +// -0.714380 +0xbf36e1a0 +// 0.411890 +0x3ed2e33b +// 0.373619 +0x3ebf4af6 +// 0.523545 +0x3f06070e +// 0.282633 +0x3e90b53f +// -0.174923 +0xbe331f19 +// -0.007010 +0xbbe5b1ef +// -0.079613 +0xbda30c06 +// 1.000000 +0x3f800000 // -1.000000 0xbf800000 -// -0.537246 -0xbf0988f0 -// -0.154000 -0xbe1db24a -// 0.401044 -0x3ecd5598 -// -0.064194 -0xbd837835 -// 0.135919 -0x3e0b2e78 -// -0.206427 -0xbe536194 -// -0.343346 -0xbeafcb0f +// -0.344610 +0xbeb070a9 +// 0.058599 +0x3d70053f +// 0.201163 +0x3e4dfdc9 +// 0.120343 +0x3df67667 +// 0.442523 +0x3ee29260 +// -0.040746 +0xbd26e4c3 +// 0.015589 +0x3c7f6a38 +// 0.248106 +0x3e7e0f9d +// 0.041901 +0x3d2ba0d6 // -1.000000 0xbf800000 +// 0.470341 +0x3ef0d08d +// 0.367631 +0x3ebc3a13 // -1.000000 0xbf800000 -// 0.810755 -0x3f4f8d9f -// -0.055716 -0xbd643694 +// 0.325216 +0x3ea682be +// 0.013054 +0x3c55e1f9 +// -0.120742 +0xbdf74761 +// -0.001310 +0xbaabaecc +// 0.612524 +0x3f1cce5e +// -0.348654 +0xbeb282ba +// -0.395595 +0xbeca8b76 +// 0.358838 +0x3eb7b991 +// -0.573885 +0xbf12ea20 +// -0.058928 +0xbd715e3c +// -0.409574 +0xbed1b3b1 +// -0.556101 +0xbf0e5ca5 +// 0.706652 +0x3f34e720 +// 0.020647 +0x3ca92371 +// -0.280305 +0xbe8f842a // 1.000000 0x3f800000 -// -0.149905 -0xbe1980a7 -// -0.693711 -0xbf319706 -// 0.440345 -0x3ee174e4 -// -0.132039 -0xbe07352a -// 0.255234 -0x3e82ae0e -// 0.940244 -0x3f70b3d7 -// 0.242254 -0x3e78118b -// 0.584487 -0x3f15a0f3 -// -0.352286 -0xbeb45ecd -// 0.542446 -0x3f0addc1 -// 0.922015 -0x3f6c0927 -// -0.291860 -0xbe956eb6 -// -1.000000 -0xbf800000 -// 0.420887 -0x3ed77e8b -// -0.212721 -0xbe59d39d -// -0.126301 -0xbe0154f6 -// -0.464466 -0xbeedce8c -// -0.757766 -0xbf41fcf3 -// -0.719272 -0xbf382234 -// 0.306882 -0x3e9d1fa7 -// 0.456527 -0x3ee9bde9 -// 0.074444 -0x3d987640 // -1.000000 0xbf800000 -// 0.811711 -0x3f4fcc49 -// 0.117568 -0x3df0c786 -// -0.007453 -0xbbf43bd0 -// 0.524351 -0x3f063be1 -// 0.380236 -0x3ec2ae50 -// -0.368739 -0xbebccb5b -// -0.263663 -0xbe86fecd -// -0.330865 -0xbea9671c -// -0.355301 -0xbeb5ea0e -// -0.137054 -0xbe0c57d3 -// -0.277405 -0xbe8e0803 -// 0.084210 -0x3dac7612 +// -0.931017 +0xbf6e5726 +// -0.100229 +0xbdcd44bc +// 0.617014 +0x3f1df499 +// 0.461258 +0x3eec29f6 +// -0.045950 +0xbd3c361f +// 0.578507 +0x3f141901 +// 0.017837 +0x3c921ea0 +// 1.000000 +0x3f800000 +// -0.246056 +0xbe7bf622 +// 0.097858 +0x3dc86998 +// 1.000000 +0x3f800000 +// 0.324241 +0x3ea602fb +// 0.511431 +0x3f02ed26 +// -0.733889 +0xbf3be02e +// 0.647586 +0x3f25c82b +// 0.771988 +0x3f45a107 +// 0.018122 +0x3c94756f +// -0.443468 +0xbee30e39 +// 0.027709 +0x3ce2fddd +// 1.000000 +0x3f800000 +// 0.283996 +0x3e9167ed +// -0.075500 +0xbd9a9f89 +// 0.081879 +0x3da7b068 +// -0.481116 +0xbef654d1 +// 0.378211 +0x3ec1a4d7 +// -0.400417 +0xbecd0378 +// -0.390386 +0xbec7e0ab +// 0.126203 +0x3e013b5d // 1.000000 0x3f800000 +// 0.633901 +0x3f224754 +// -0.666479 +0xbf2a9e5a +// -0.043814 +0xbd337694 +// -0.429737 +0xbedc0681 +// -0.516305 +0xbf042c96 +// -0.603102 +0xbf1a64e7 +// 0.031491 +0x3d00fc6e +// 0.534410 +0x3f08cf1e +// 0.103479 +0x3dd3ece1 +// -0.781604 +0xbf481730 diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoRefs2_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoRefs2_f32.txt index e3e5a83eb..94532e72c 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoRefs2_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/AllBiquadStereoRefs2_f32.txt @@ -1,266 +1,266 @@ W 132 +// 0.001769 +0x3ae7dc6a +// 0.003276 +0x3b56ad1a +// 0.016841 +0x3c89f6e8 +// 0.009294 +0x3c184498 +// -0.042615 +0xbd2e8ce7 +// -0.006021 +0xbbc54c94 +// 0.004734 +0x3b9b2207 +// 0.001762 +0x3ae6fcee +// 0.013847 +0x3c62dedf +// -0.007373 +0xbbf196ce +// 0.032856 +0x3d069471 +// -0.042356 +0xbd2d7d8d +// 0.078673 +0x3da11f78 +// -0.084440 +0xbdaceeca +// 0.130797 +0x3e05efb2 +// -0.127434 +0xbe027def +// 0.176154 +0x3e3461cb +// -0.153373 +0xbe1d0dda +// 0.212493 +0x3e5997bd +// -0.130638 +0xbe05c5d8 +// 0.233657 +0x3e6f43c1 +// -0.084710 +0xbdad7c61 +// 0.010349 +0x3c298f65 +// -0.002632 +0xbb2c8468 +// 0.045514 +0x3d3a6d14 +// 0.001738 +0x3ae3ddc3 +// 0.080507 +0x3da4e102 +// 0.051425 +0x3d52a350 +// 0.086535 +0x3db13981 +// 0.158371 +0x3e222be9 +// 0.100651 +0x3dce224b +// 0.249925 +0x3e7fec6a +// 0.144454 +0x3e13ebc1 +// 0.234220 +0x3e6fd778 +// 0.168426 +0x3e2c77ce +// 0.114922 +0x3deb5c68 +// 0.141546 +0x3e10f156 +// -0.004830 +0xbb9e4461 +// 0.106673 +0x3dda7722 +// -0.057194 +0xbd6a43c3 +// 0.129507 +0x3e049d74 +// -0.086149 +0xbdb06ee0 +// 0.193405 +0x3e460bde +// -0.132417 +0xbe07983e // 0.020000 0x3ca3d70a -// 0.011234 -0x3c380d8d -// 0.055900 -0x3d64f6e7 -// 0.031085 -0x3cfea6d3 -// 0.072883 -0x3d9543cc -// 0.027615 -0x3ce238d1 -// -0.008955 -0xbc12b8bc -// -0.000405 -0xb9d433a7 -// 0.053821 -0x3d5c7346 -// -0.008490 -0xbc0b195a -// -0.193340 -0xbe45faed -// 0.049234 -0x3d49a9e3 -// 0.513563 -0x3f0378e3 -// -0.164291 -0xbe283bef -// -1.109050 -0xbf8df559 -// 0.378700 -0x3ec1e4fc -// 2.009222 -0x40009718 -// -0.681898 -0xbf2e90e4 -// -3.098030 -0xc0464621 -// 0.982403 -0x3f7b7ebf -// 4.080722 -0x40829547 -// -1.146704 -0xbf92c72f -// -0.013382 -0xbc5b4085 -// -0.008050 -0xbc03e59d -// -0.042899 -0xbd2fb6ba -// -0.025307 -0xbccf519f -// -0.041428 -0xbd29b07c -// -0.009761 -0xbc1fed41 -// 0.002628 -0x3b2c3898 -// 0.064111 -0x3d834c90 -// 0.015366 -0x3c7bc19a -// 0.094655 -0x3dc1da96 -// -0.000976 -0xba7fed63 -// -0.017070 -0xbc8bd574 -// 0.036623 -0x3d160196 -// -0.142240 -0xbe11a765 -// 0.093172 -0x3dbed0f0 -// -0.105422 -0xbdd7e7aa -// 0.044981 -0x3d383dcf -// 0.019934 -0x3ca34d54 -// -0.082501 -0xbda8f659 -// 0.082620 -0x3da93489 -// -0.119776 -0xbdf54d25 -// 0.083897 -0x3dabd24b -// -0.015001 -0xbc75c8af -// -0.020000 -0xbca3d70a -// -0.011961 -0xbc43f9a7 -// 0.013795 -0x3c6203de -// -0.007406 -0xbbf2b03c -// -0.048643 -0xbd473d5d -// 0.020000 -0x3ca3d70a -// -0.020000 -0xbca3d70a -// 0.075914 -0x3d9b78d8 -// -0.055369 -0xbd62ca5f -// 0.162109 -0x3e25fff0 -// -0.087187 -0xbdb28ef9 -// 0.301184 -0x3e9a34d1 -// -0.133902 -0xbe091d90 -// 0.474970 -0x3ef32f44 -// -0.135893 -0xbe0b278f -// 0.621514 -0x3f1f1b8a -// -0.044669 -0xbd36f73d -// 0.746168 -0x3f3f04e3 -// 0.110470 -0x3de23de8 -// 0.832243 -0x3f550dde -// 0.383311 -0x3ec4415f -// 0.002561 -0x3b27dcb6 -// -0.001853 -0xbaf2d7e4 -// 0.016286 -0x3c8569dd -// -0.027159 -0xbcde7c77 -// 0.023050 -0x3cbcd362 -// -0.183804 -0xbe3c3722 -// -0.120717 -0xbdf73a80 -// -0.769313 -0xbf44f1b4 -// -0.705511 -0xbf349c5a -// -2.244718 -0xc00fa974 -// -1.904387 -0xbff3c2f2 -// -4.877386 -0xc09c138c -// -3.425609 -0xc05b3d2e -// -8.259460 -0xc10426c0 -// -4.592662 -0xc092f716 -// -11.387343 -0xc136328f -// -4.868969 -0xc09bce97 -// -13.581676 -0xc1594e8b -// -4.313825 -0xc08a0adb -// -15.353149 -0xc175a67f -// -3.625409 -0xc06806b5 -// -17.998041 -0xc18ffbfd -// 0.002718 -0x3b322700 -// -0.004129 -0xbb8748b1 -// 0.008925 -0x3c12386f -// -0.043983 -0xbd3427cc -// -0.025665 -0xbcd23f35 -// -0.151948 -0xbe1b9858 -// -0.001114 -0xba920e74 -// 0.020000 -0x3ca3d70a -// -0.002224 -0xbb11c874 -// -0.027759 -0xbce36786 -// 0.004722 -0x3b9ab905 -// 0.117670 -0x3df0fd01 -// -0.012871 -0xbc52df41 -// -0.141039 -0xbe106c81 -// 0.045150 -0x3d38eee2 -// 0.359069 -0x3eb7d7e5 -// -0.053628 -0xbd5ba88b -// -0.340209 -0xbeae2fd1 -// 0.170905 -0x3e2f01be -// 0.680563 -0x3f2e3967 -// -0.180991 -0xbe3955ce -// -0.477400 -0xbef46dc6 -// -0.004254 -0xbb8b68b7 -// -0.002526 -0xbb258b78 -// -0.016652 -0xbc886a6a -// -0.019527 -0xbc9ff714 -// -0.062913 -0xbd80d8c2 -// -0.039359 -0xbd21368c -// -0.132137 -0xbe074ee7 -// -0.130513 -0xbe05a51d -// -0.316513 -0xbea20e09 -// -0.157788 -0xbe21933c -// -0.465959 -0xbeee9221 -// -0.336363 -0xbeac37ca -// -0.846801 -0xbf58c7f2 -// -0.256820 -0xbe837de3 -// -0.993027 -0xbf7e3707 -// -0.389138 -0xbec73d0a -// -1.428914 -0xbfb6e6a5 -// -0.106705 -0xbdda8855 -// -1.477528 -0xbfbd1fa2 -// -0.076535 -0xbd9cbe2c -// -1.685673 -0xbfd7c425 -// 0.279158 -0x3e8eedc2 +// -0.010509 +0xbc2c2f3c +// 0.083206 +0x3daa680a +// -0.031481 +0xbd00f237 +// 0.136475 +0x3e0bbffd +// -0.015466 +0xbc7d64c3 +// 0.000533 +0x3a0b9d16 +// 0.013375 +0x3c5b23b3 +// -0.010707 +0xbc2f6e59 +// 0.032467 +0x3d04fba7 +// -0.032931 +0xbd06e2d4 +// 0.027033 +0x3cdd73c2 +// -0.023462 +0xbcc03408 +// 0.022475 +0x3cb81c84 +// 0.017265 +0x3c8d6e8f +// 0.049003 +0x3d48b779 +// 0.027164 +0x3cde8711 +// 0.093786 +0x3dc012ae +// -0.020278 +0xbca61de9 +// 0.145370 +0x3e14dbf7 +// -0.091577 +0xbdbb8c98 +// 0.155573 +0x3e1f4e7a +// 0.002407 +0x3b1dbc6b +// 0.008850 +0x3c110185 +// -0.011104 +0xbc35eeb9 +// -0.037524 +0xbd19b2da +// 0.021992 +0x3cb4285d +// 0.049316 +0x3d49ffe1 +// -0.042897 +0xbd2fb4e7 +// 0.018252 +0x3c9584c2 +// 0.098282 +0x3dc947e1 +// -0.134240 +0xbe097623 +// -0.112608 +0xbde69ee7 +// 0.179632 +0x3e37f182 +// -0.050841 +0xbd503e68 +// -0.070077 +0xbd8f8455 +// 0.256241 +0x3e8331fc +// -0.148710 +0xbe18477c +// -0.206155 +0xbe531a6a +// 0.252203 +0x3e8120c5 +// -0.028113 +0xbce64c47 +// -0.080866 +0xbda59d49 +// 0.161414 +0x3e2549ba +// -0.155758 +0xbe1f7f25 +// 0.014133 +0x3c678e3d +// 0.000413 +0x39d87f49 +// 0.084651 +0x3dad5d5c +// 0.022637 +0x3cb97172 +// 0.190052 +0x3e429cfa +// 0.116288 +0x3dee2830 +// -0.002005 +0xbb035f31 +// 0.012340 +0x3c4a2ed8 +// 0.001379 +0x3ab4b131 +// 0.047385 +0x3d4216bc +// 0.040846 +0x3d274e86 +// 0.038831 +0x3d1f0cd6 +// 0.109656 +0x3de0934c +// -0.086167 +0xbdb0787f +// 0.089274 +0x3db6d568 +// -0.170795 +0xbe2ee4c7 +// -0.114022 +0xbde98473 +// 0.010343 +0x3c297795 +// -0.350637 +0xbeb386ad +// 0.260901 +0x3e8594c9 +// -0.334898 +0xbeab77b2 +// 0.175235 +0x3e3370b8 +// -0.008869 +0xbc1150c8 +// 0.000554 +0x3a114650 +// 0.068364 +0x3d8c02af +// 0.002658 +0x3b2e31ad +// -0.273895 +0xbe8c3c03 +// -0.019130 +0xbc9cb672 +// 0.766872 +0x3f4451b6 +// 0.078237 +0x3da03aae +// -1.667028 +0xbfd5612b +// -0.226192 +0xbe679ec4 +// 2.959857 +0x403d6e4b +// 0.549945 +0x3f0cc92a +// -4.393206 +0xc08c9525 +// -1.163271 +0xbf94e611 +// 5.463283 +0x40aed336 +// 2.190424 +0x400c2fe8 +// -5.541438 +0xc0b15376 +// -3.680836 +0xc06b92d0 +// 4.127624 +0x40841580 +// 5.522989 +0x40b0bc53 +// -1.129602 +0xbf9096d0 +// -7.380613 +0xc0ec2dfc diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadInput1_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadInput1_f32.txt index f4932288c..83c4dd5d1 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadInput1_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadInput1_f32.txt @@ -1,202 +1,202 @@ W 100 -// -0.029936 -0xbcf53bc7 -// 0.284509 -0x3e91ab21 -// 0.668647 -0x3f2b2c74 -// 0.306880 -0x3e9d1f6b -// 0.213973 -0x3e5b1bd3 -// 0.538225 -0x3f09c922 -// 0.766250 -0x3f4428f3 -// 0.563234 -0x3f103015 -// 0.112109 -0x3de599a3 -// -0.020372 -0xbca6e341 -// -0.042498 -0xbd2e1214 -// -0.016551 -0xbc87968f -// -0.168763 -0xbe2cd052 -// -0.610973 -0xbf1c68c2 -// -0.835429 -0xbf55dea8 -// -0.638178 -0xbf235faa -// -0.318169 -0xbea2e717 -// -0.268756 -0xbe899a6f -// -0.400647 -0xbecd218b -// -0.380073 -0xbec298f8 -// -0.021168 -0xbcad67b9 -// 0.535375 -0x3f090e58 -// 0.548437 -0x3f0c6656 -// 0.420556 -0x3ed75328 -// 0.390134 -0x3ec7bfac -// 0.561865 -0x3f0fd65f -// 0.685807 -0x3f2f9107 -// 0.536016 -0x3f093857 -// 0.159308 -0x3e232195 -// 0.003765 -0x3b76b844 -// 0.156077 -0x3e1fd2af -// 0.181969 -0x3e3a5613 -// -0.368482 -0xbebca9b8 -// -0.605390 -0xbf1afad6 -// -0.777347 -0xbf47003b -// -0.556542 -0xbf0e7990 -// -0.451493 -0xbee72a14 -// -0.323351 -0xbea58e41 -// -0.463146 -0xbeed2177 -// -0.353012 -0xbeb4be03 -// 0.174874 -0x3e331239 -// 0.399463 -0x3ecc8678 -// 0.404406 -0x3ecf0e59 -// 0.254541 -0x3e825328 -// 0.455669 -0x3ee94d66 -// 0.860756 -0x3f5c5a80 -// 0.585422 -0x3f15de38 -// 0.568229 -0x3f11777b -// -0.103649 -0xbdd445fa -// -0.044666 -0xbd36f3c5 -// 0.276870 -0x3e8dc1e1 -// -0.181632 -0xbe39fdc0 -// -0.381814 -0xbec37d10 -// -0.617524 -0xbf1e1615 -// -0.509072 -0xbf025288 -// -0.454603 -0xbee8c1b9 -// -0.260066 -0xbe852759 -// -0.569666 -0xbf11d5a3 -// -0.268410 -0xbe896cfa -// -0.266821 -0xbe889cbe -// 0.137461 -0x3e0cc29d -// 0.464295 -0x3eedb816 -// 0.189090 -0x3e41a0d4 -// 0.505298 -0x3f015b2f -// 0.462849 -0x3eecfa87 -// 0.808854 -0x3f4f110d -// 0.700242 -0x3f33430d -// 0.584979 -0x3f15c127 -// -0.081238 -0xbda65fed -// -0.004254 -0xbb8b684e -// -0.014496 -0xbc6d801f -// -0.298948 -0xbe990fb9 -// -0.619392 -0xbf1e907d -// -1.000000 -0xbf800000 -// -0.529186 -0xbf0778bf -// -0.422518 -0xbed8543d -// -0.219093 -0xbe605a08 -// -0.475159 -0xbef34813 -// -0.340739 -0xbeae7557 -// -0.209597 -0xbe56a0a4 -// 0.298132 -0x3e98a4c2 -// 0.465727 -0x3eee73cf -// 0.361978 -0x3eb95539 -// 0.136394 -0x3e0baadd -// 0.374122 -0x3ebf8ced -// 0.536019 -0x3f09388c -// 0.623578 -0x3f1fa2cb -// 0.434130 -0x3ede4653 -// 0.117249 -0x3df02037 -// 0.199612 -0x3e4c6717 -// -0.080717 -0xbda54f14 -// -0.139196 -0xbe0e8987 -// -0.590724 -0xbf1739b0 -// -0.677539 -0xbf2d733a -// -0.477806 -0xbef4a308 -// -0.287157 -0xbe930645 -// -0.475920 -0xbef3abd9 -// -0.179729 -0xbe380acc -// -0.342610 -0xbeaf6a8e -// 0.096826 -0x3dc64ce8 +// -0.058198 +0xbd6e6135 +// 0.542090 +0x3f0ac668 +// 0.394593 +0x3eca0813 +// 0.239908 +0x3e75aa8c +// 0.313652 +0x3ea09703 +// 0.382391 +0x3ec3c8c8 +// 0.780721 +0x3f47dd58 +// 0.721098 +0x3f3899e3 +// 0.105363 +0x3dd7c8b1 +// 0.147942 +0x3e177e21 +// -0.138040 +0xbe0d5a4f +// -0.006769 +0xbbddce44 +// -0.142735 +0xbe12291f +// -0.648427 +0xbf25ff4f +// -0.811666 +0xbf4fc955 +// -0.617589 +0xbf1e1a51 +// -0.224564 +0xbe65f3fa +// -0.360722 +0xbeb8b09e +// -0.568707 +0xbf1196c7 +// -0.478976 +0xbef53c4c +// 0.123487 +0x3dfce69d +// 0.655571 +0x3f27d37c +// 0.488235 +0x3ef9f9e7 +// 0.355716 +0x3eb6205a +// 0.402827 +0x3ece3f50 +// 0.766138 +0x3f44219d +// 0.779081 +0x3f4771dc +// 0.577306 +0x3f13ca4e +// 0.088456 +0x3db5286f +// -0.272044 +0xbe8b4965 +// -0.146637 +0xbe16281e +// -0.145512 +0xbe150138 +// -0.401513 +0xbecd9315 +// -0.747423 +0xbf3f571c +// -0.885627 +0xbf62b879 +// -0.562746 +0xbf101019 +// -0.399372 +0xbecc7a6c +// -0.495452 +0xbefdabde +// -0.682028 +0xbf2e9968 +// -0.282652 +0xbe90b7bd +// 0.424439 +0x3ed9501c +// 0.522086 +0x3f05a773 +// 0.408502 +0x3ed1273a +// 0.457581 +0x3eea4810 +// 0.329377 +0x3ea8a40c +// 0.788664 +0x3f49e5db +// 0.800642 +0x3f4cf6de +// 0.236911 +0x3e7298b7 +// 0.247968 +0x3e7deb67 +// -0.032999 +0xbd0729ab +// -0.051062 +0xbd5126bb +// -0.095968 +0xbdc48b16 +// -0.476905 +0xbef42ced +// -0.883218 +0xbf621a94 +// -0.756280 +0xbf419b8e +// -0.340354 +0xbeae42d2 +// -0.147683 +0xbe173a2e +// -0.445798 +0xbee43f9b +// -0.729152 +0xbf3aa9ae +// -0.223870 +0xbe653e12 +// 0.300510 +0x3e99dc63 +// 0.464516 +0x3eedd4fd +// 0.249595 +0x3e7f95cd +// 0.368075 +0x3ebc7462 +// 0.611150 +0x3f1c7453 +// 1.000000 +0x3f800000 +// 0.953099 +0x3f73fe4a +// 0.114019 +0x3de982e8 +// -0.130405 +0xbe0588e9 +// -0.206464 +0xbe536b5d +// -0.121584 +0xbdf90107 +// -0.158005 +0xbe21cc07 +// -0.475983 +0xbef3b410 +// -0.790303 +0xbf4a5148 +// -0.844797 +0xbf5844a2 +// -0.445148 +0xbee3ea7b +// -0.322243 +0xbea4fd04 +// -0.324206 +0xbea5fe5b +// -0.562453 +0xbf0ffce8 +// -0.293915 +0xbe967c12 +// 0.357814 +0x3eb7335b +// 0.485007 +0x3ef852e6 +// 0.571161 +0x3f123794 +// 0.356639 +0x3eb69961 +// 0.450283 +0x3ee68b7d +// 0.814540 +0x3f5085af +// 0.594664 +0x3f183bef +// 0.511423 +0x3f02ec9e +// -0.139750 +0xbe0f1abd +// -0.046449 +0xbd3e41c1 +// 0.022215 +0x3cb5fccd +// -0.312890 +0xbea0330e +// -0.545489 +0xbf0ba524 +// -0.732840 +0xbf3b9b61 +// -0.563232 +0xbf102ff3 +// -0.334027 +0xbeab058d +// -0.284090 +0xbe917431 +// -0.478688 +0xbef5168a +// -0.290333 +0xbe94a697 +// -0.059755 +0xbd74c152 diff --git a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadOutput1_f32.txt b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadOutput1_f32.txt index bb03985e6..be322b29f 100755 --- a/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadOutput1_f32.txt +++ b/Testing/Patterns/DSP/Filtering/BIQUAD/BIQUADF32/BiquadOutput1_f32.txt @@ -1,202 +1,202 @@ W 100 -// -0.000599 -0xba1cf30f -// 0.005226 -0x3bab3ad5 -// 0.016770 -0x3c896159 -// 0.024694 -0x3cca4ba9 -// 0.044170 -0x3d34eb78 -// 0.074355 -0x3d98474d -// 0.109367 -0x3ddffb9d -// 0.145884 -0x3e156293 -// 0.182184 -0x3e3a8e79 -// 0.218158 -0x3e5f64c3 -// 0.242754 -0x3e78947c -// 0.251286 -0x3e80a895 -// 0.237083 -0x3e72c5d4 -// 0.194167 -0x3e46d3d5 -// 0.125929 -0x3e00f3a8 -// 0.035255 -0x3d10671d -// -0.074270 -0xbd981b15 -// -0.195479 -0xbe482bae -// -0.314589 -0xbea111c9 -// -0.416489 -0xbed53e19 -// -0.487592 -0xbef9a5b1 -// -0.516933 -0xbf0455b7 -// -0.505346 -0xbf015e56 -// -0.444061 -0xbee35bf0 -// -0.337053 -0xbeac923f -// -0.193626 -0xbe4645ec -// -0.029830 -0xbcf45f15 -// 0.136365 -0x3e0ba33a -// 0.287256 -0x3e93132a -// 0.410479 -0x3ed22a4d -// 0.493364 -0x3efc9a2d -// 0.523950 -0x3f06219a -// 0.494473 -0x3efd2b97 -// 0.419690 -0x3ed6e1a9 -// 0.299752 -0x3e997914 -// 0.153093 -0x3e1cc471 -// -0.010725 -0xbc2fb69f -// -0.170172 -0xbe2e418b -// -0.314925 -0xbea13de4 -// -0.425629 -0xbed9ebfe -// -0.490768 -0xbefb45e4 -// -0.513210 -0xbf0361b8 -// -0.487922 -0xbef9d0de -// -0.419595 -0xbed6d520 -// -0.310220 -0xbe9ed526 -// -0.171695 -0xbe2fd0ef -// -0.027309 -0xbcdfb793 -// 0.125358 -0x3e005ddd -// 0.253911 -0x3e82009b -// 0.365636 -0x3ebb3497 -// 0.442757 -0x3ee2b0ff -// 0.466849 -0x3eef06e1 -// 0.452471 -0x3ee7aa3f -// 0.392128 -0x3ec8c4f8 -// 0.297008 -0x3e98116d -// 0.171039 -0x3e2f24f4 -// 0.032305 -0x3d045273 -// -0.115669 -0xbdece40e -// -0.242103 -0xbe77e9f8 -// -0.350754 -0xbeb39607 -// -0.417876 -0xbed5f3cd -// -0.442701 -0xbee2a9b4 -// -0.429332 -0xbedbd167 -// -0.362003 -0xbeb9586a -// -0.264328 -0xbe8755f2 -// -0.131543 -0xbe06b345 -// 0.011559 -0x3c3d616e -// 0.159848 -0x3e23af4b -// 0.286903 -0x3e92e4fb -// 0.397047 -0x3ecb49ba -// 0.465086 -0x3eee1fbb -// 0.484306 -0x3ef7f6fe -// 0.454901 -0x3ee8e8ca -// 0.374406 -0x3ebfb232 -// 0.262631 -0x3e867787 -// 0.113661 -0x3de8c715 -// -0.045224 -0xbd393c7a -// -0.207083 -0xbe540d98 -// -0.343815 -0xbeb00880 -// -0.449561 -0xbee62ce6 -// -0.504616 -0xbf012e85 -// -0.510836 -0xbf02c62a -// -0.464376 -0xbeedc2b5 -// -0.371376 -0xbebe2501 -// -0.236285 -0xbe71f4af -// -0.081845 -0xbda79e2f -// 0.079134 -0x3da2110d -// 0.227988 -0x3e6975ac -// 0.350809 -0x3eb39d35 -// 0.442529 -0x3ee29319 -// 0.483646 -0x3ef7a07e -// 0.482724 -0x3ef72790 -// 0.430624 -0x3edc7ab2 -// 0.344373 -0x3eb051b3 -// 0.230957 -0x3e6c7fec -// 0.100415 -0x3dcda67d -// -0.038467 -0xbd1d8fcf -// -0.159872 -0xbe23b57d -// -0.269742 -0xbe8a1b97 -// -0.341214 -0xbeaeb3a0 +// -0.001164 +0xba989022 +// 0.009938 +0x3c22d4ed +// 0.014325 +0x3c6ab3b7 +// 0.026447 +0x3cd8a6db +// 0.046917 +0x3d402c09 +// 0.071278 +0x3d91fa37 +// 0.106973 +0x3ddb14ad +// 0.143048 +0x3e127b36 +// 0.175339 +0x3e338c2a +// 0.214607 +0x3e5bc1f4 +// 0.236436 +0x3e721c3e +// 0.249311 +0x3e7f4b5d +// 0.238187 +0x3e73e756 +// 0.198201 +0x3e4af526 +// 0.135420 +0x3e0aab9c +// 0.048941 +0x3d487607 +// -0.055413 +0xbd62f858 +// -0.176853 +0xbe3518ff +// -0.297391 +0xbe9843a0 +// -0.403211 +0xbece719f +// -0.478717 +0xbef51a73 +// -0.516926 +0xbf04554b +// -0.515222 +0xbf03e596 +// -0.460477 +0xbeebc3a7 +// -0.358128 +0xbeb75c9b +// -0.214356 +0xbe5b8009 +// -0.049683 +0xbd4b80bd +// 0.123818 +0x3dfd946b +// 0.283824 +0x3e915152 +// 0.414327 +0x3ed422aa +// 0.503174 +0x3f00cffe +// 0.532451 +0x3f084eba +// 0.499291 +0x3effa30e +// 0.407859 +0x3ed0d2da +// 0.268743 +0x3e8998b4 +// 0.100049 +0x3dcce6c0 +// -0.086419 +0xbdb0fc60 +// -0.269137 +0xbe89cc45 +// -0.428412 +0xbedb58cc +// -0.540354 +0xbf0a549e +// -0.596096 +0xbf1899bf +// -0.598814 +0xbf194bda +// -0.541221 +0xbf0a8d7a +// -0.428186 +0xbedb3b2f +// -0.280321 +0xbe8f8645 +// -0.100336 +0xbdcd7ce9 +// 0.080527 +0x3da4eb3a +// 0.244989 +0x3e7ade48 +// 0.392384 +0x3ec8e696 +// 0.493160 +0x3efc7f7b +// 0.549398 +0x3f0ca557 +// 0.553692 +0x3f0dbec8 +// 0.503610 +0x3f00ec9d +// 0.407536 +0x3ed0a897 +// 0.280520 +0x3e8fa05d +// 0.132451 +0x3e07a14e +// -0.024987 +0xbcccb098 +// -0.179232 +0xbe3788a6 +// -0.312998 +0xbea0413c +// -0.407195 +0xbed07be5 +// -0.463578 +0xbeed5a21 +// -0.477034 +0xbef43dbd +// -0.446411 +0xbee49008 +// -0.367328 +0xbebc1261 +// -0.252391 +0xbe813967 +// -0.108042 +0xbddd452d +// 0.048075 +0x3d44e9e7 +// 0.195691 +0x3e486353 +// 0.336084 +0x3eac1331 +// 0.443559 +0x3ee31a1e +// 0.509626 +0x3f0276d5 +// 0.526027 +0x3f06a9ae +// 0.488941 +0x3efa5673 +// 0.402781 +0x3ece3942 +// 0.275364 +0x3e8cfc7b +// 0.122032 +0x3df9ebb5 +// -0.049504 +0xbd4ac505 +// -0.216135 +0xbe5d529c +// -0.364610 +0xbebaae24 +// -0.471010 +0xbef1282d +// -0.525453 +0xbf068410 +// -0.531071 +0xbf07f43f +// -0.476865 +0xbef427a9 +// -0.375566 +0xbec04a2b +// -0.231177 +0xbe6cb9b7 +// -0.059509 +0xbd73c014 +// 0.111672 +0x3de4b443 +// 0.277834 +0x3e8e404d +// 0.407734 +0x3ed0c283 +// 0.506671 +0x3f01b52b +// 0.552920 +0x3f0d8c2c +// 0.540695 +0x3f0a6af5 +// 0.479536 +0x3ef585bf +// 0.372249 +0x3ebe976a +// 0.234340 +0x3e6ff6ed +// 0.077152 +0x3d9e0204 +// -0.084152 +0xbdac57ea +// -0.235079 +0xbe70b891 +// -0.354168 +0xbeb5558a +// -0.437210 +0xbedfd9f8 diff --git a/Testing/Source/Tests/BIQUADF32.cpp b/Testing/Source/Tests/BIQUADF32.cpp index 95176020a..bde546144 100755 --- a/Testing/Source/Tests/BIQUADF32.cpp +++ b/Testing/Source/Tests/BIQUADF32.cpp @@ -10,8 +10,7 @@ Reference patterns are generated with a double precision computation. */ -#define REL_ERROR (1.2e-3) - +#define REL_ERROR (2.0e-4) void BIQUADF32::test_biquad_cascade_df1_ref() { @@ -118,9 +117,12 @@ a double precision computation. The filter is initialized with the coefs, blockSize and numTaps. */ -#if !defined(ARM_MATH_NEON) +// Neon disabled because this filter has issues with Neon. +// So test changed to use the scalar version +//#if !defined(ARM_MATH_NEON) arm_biquad_cascade_df2T_init_f32(&this->Sdf2T,3,coefsp,statep); -#else +#if 0 +//#else float32_t *vecCoefsPtr = vecCoefs.ptr(); // Those Neon coefs must be computed from original coefs @@ -244,11 +246,13 @@ a double precision computation. float32_t *statep = state.ptr(); const int16_t *configsp = configs.ptr(); -#if !defined(ARM_MATH_NEON) +// Neon version has issues and is disabled. +// So the test is not using Neon version +//#if !defined(ARM_MATH_NEON) const float32_t *coefsp = coefs.ptr(); -#else - float32_t *coefsp = coefs.ptr(); -#endif +//#else +// float32_t *coefsp = coefs.ptr(); +//#endif const float32_t *inputp = inputs.ptr(); float32_t *outp = output.ptr(); @@ -284,9 +288,10 @@ a double precision computation. The filter is initialized with the coefs, blockSize and numTaps. */ -#if !defined(ARM_MATH_NEON) +//#if !defined(ARM_MATH_NEON) arm_biquad_cascade_df2T_init_f32(&this->Sdf2T,numStages,coefsp,statep); -#else +//#else +#if 0 float32_t *vecCoefsPtr = vecCoefs.ptr(); // Those Neon coefs must be computed from original coefs diff --git a/Testing/Source/Tests/BasicTestsF32.cpp b/Testing/Source/Tests/BasicTestsF32.cpp index 8b7c0d9a8..3a77e2d28 100644 --- a/Testing/Source/Tests/BasicTestsF32.cpp +++ b/Testing/Source/Tests/BasicTestsF32.cpp @@ -25,7 +25,7 @@ float32_t *outp=output.ptr(); ASSERT_EMPTY_TAIL(output); - ASSERT_SNR(output,ref,(float32_t)SNR_THRESHOLD); + ASSERT_SNR(output,ref,(double)SNR_THRESHOLD); ASSERT_REL_ERROR(output,ref,REL_ERROR); diff --git a/Testing/Source/Tests/FastMathF16.cpp b/Testing/Source/Tests/FastMathF16.cpp index ad0a33371..d320d406c 100755 --- a/Testing/Source/Tests/FastMathF16.cpp +++ b/Testing/Source/Tests/FastMathF16.cpp @@ -108,7 +108,7 @@ a double precision computation. arm_vlog_f16(inp,outp,ref.nbSamples()); - //ASSERT_SNR(ref,output,(float16_t)SNR_THRESHOLD); + ASSERT_SNR(ref,output,SNR_THRESHOLD); ASSERT_CLOSE_ERROR(ref,output,ABS_ERROR,REL_ERROR); ASSERT_EMPTY_TAIL(output); diff --git a/Testing/Source/Tests/TransformRF16.cpp b/Testing/Source/Tests/TransformRF16.cpp index 82d2e5fe1..0e9764e52 100755 --- a/Testing/Source/Tests/TransformRF16.cpp +++ b/Testing/Source/Tests/TransformRF16.cpp @@ -53,7 +53,7 @@ static double abs_err,rel_err; // To investigate ... for(unsigned int i=0;i") if passed != 1: - print("%s at line %d" % (errorStr(theError), theLine)) if (len(errorDetail)>0): print("" + errorDetail + "") @@ -578,6 +577,7 @@ def analyze(root,results,args,trace): parser.add_argument('-b', nargs='?',type = str, default="FullBenchmark", help="Full Benchmark dir path") parser.add_argument('-m', action='store_true', help="Mathematica output") parser.add_argument('-t', nargs='?',type = str, default=None, help="External trace file") +parser.add_argument('--noerr', action='store_true', help="Exit code forced to 0") args = parser.parse_args() @@ -601,7 +601,10 @@ def analyze(root,results,args,trace): with open(args.r,"r") as results: extractDataFiles(results,args.o) - sys.exit(resultStatus) + if args.noerr: + sys.exit(0) + else: + sys.exit(resultStatus) else: parser.print_help() \ No newline at end of file diff --git a/Testing/testmain.cpp b/Testing/testmain.cpp index 2e49b16f5..ec1f7ec84 100644 --- a/Testing/testmain.cpp +++ b/Testing/testmain.cpp @@ -47,7 +47,7 @@ int testmain(const char *patterns) // There is also possibility of using "FPGA" io #if defined(EMBEDDED) - Client::FPGA io((const char*)testDesc,(const char*)patterns); + Client::FPGA io((const unsigned char*)testDesc,(const char*)patterns); #else Client::Semihosting io("../TestDesc.txt","../Patterns","../Output","../Parameters"); #endif diff --git a/vcpkg-neon-configuration.json b/vcpkg-neon-configuration.json new file mode 100644 index 000000000..58733727f --- /dev/null +++ b/vcpkg-neon-configuration.json @@ -0,0 +1,14 @@ +{ + "registries": [ + { + "name": "arm", + "kind": "artifact", + "location": "https://artifacts.tools.arm.com/vcpkg-registry" + } + ], + "requires": { + "arm:tools/kitware/cmake": "3.28.4", + "arm:tools/ninja-build/ninja": "1.12.0", + } +} +