-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathDownsampler2x8F64Avx512.h
134 lines (72 loc) · 3.55 KB
/
Downsampler2x8F64Avx512.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
/*****************************************************************************
Downsampler2x8F64Avx512.h
Author: Laurent de Soras, 2020
Downsamples the input signal by a factor 2, processing vectors of 8 double
(8 channels at once), using the AVX-512 instruction set.
This object must be aligned on a 64-byte boundary!
Template parameters:
- NC: number of coefficients, > 0
--- Legal stuff ---
This program is free software. It comes without any warranty, to
the extent permitted by applicable law. You can redistribute it
and/or modify it under the terms of the Do What The Fuck You Want
To Public License, Version 2, as published by Sam Hocevar. See
http://sam.zoy.org/wtfpl/COPYING for more details.
*Tab=3***********************************************************************/
#pragma once
#if ! defined (hiir_Downsampler2x8F64Avx512_HEADER_INCLUDED)
#define hiir_Downsampler2x8F64Avx512_HEADER_INCLUDED
#if defined (_MSC_VER)
#pragma warning (4 : 4250)
#endif
/*\\\ INCLUDE FILES \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
#include "hiir/def.h"
#include "hiir/StageDataF64Avx512.h"
#include <immintrin.h>
#include <array>
namespace hiir
{
template <int NC>
class Downsampler2x8F64Avx512
{
static_assert ((NC > 0), "Number of coefficient must be positive.");
/*\\\ PUBLIC \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
public:
typedef double DataType;
static const int _nbr_chn = 8;
enum { NBR_COEFS = NC };
Downsampler2x8F64Avx512 ();
Downsampler2x8F64Avx512 (const Downsampler2x8F64Avx512 <NC> &other) = default;
Downsampler2x8F64Avx512 (Downsampler2x8F64Avx512 <NC> &&other) = default;
~Downsampler2x8F64Avx512 () = default;
Downsampler2x8F64Avx512 <NC> &
operator = (const Downsampler2x8F64Avx512 <NC> &other) = default;
Downsampler2x8F64Avx512 <NC> &
operator = (Downsampler2x8F64Avx512 <NC> &&other) = default;
void set_coefs (const double coef_arr []);
hiir_FORCEINLINE __m512d
process_sample (const double in_ptr [_nbr_chn * 2]);
hiir_FORCEINLINE __m512d
process_sample (__m512d in_0, __m512d in_1);
void process_block (double out_ptr [], const double in_ptr [], long nbr_spl);
hiir_FORCEINLINE void
process_sample_split (__m512d &low, __m512d &high, const double in_ptr [_nbr_chn * 2]);
hiir_FORCEINLINE void
process_sample_split (__m512d &low, __m512d &high, __m512d in_0, __m512d in_1);
void process_block_split (double out_l_ptr [], double out_h_ptr [], const double in_ptr [], long nbr_spl);
void clear_buffers ();
/*\\\ PROTECTED \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
protected:
/*\\\ PRIVATE \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
typedef std::array <StageDataF64Avx512, NBR_COEFS + 2> Filter; // Stages 0 and 1 contain only input memories
Filter _filter; // Should be the first member (thus easier to align)
/*\\\ FORBIDDEN MEMBER FUNCTIONS \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
bool operator == (const Downsampler2x8F64Avx512 <NC> &other) const = delete;
bool operator != (const Downsampler2x8F64Avx512 <NC> &other) const = delete;
}; // class Downsampler2x8F64Avx512
} // namespace hiir
#include "hiir/Downsampler2x8F64Avx512.hpp"
#endif // hiir_Downsampler2x8F64Avx512_HEADER_INCLUDED
/*\\\ EOF \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/