-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathDownsampler2x4F64Avx.h
135 lines (73 loc) · 3.57 KB
/
Downsampler2x4F64Avx.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
/*****************************************************************************
Downsampler2x4F64Avx.h
Port of Downsampler2x4Sse.h from float to double by Dario Mambro
Downsampler2x4Sse.h by Laurent de Soras, 2015
Downsamples the input signal by a factor 2, processing vectors of 4 double
at a time with the AVX instruction set.
This object must be aligned on a 32-byte boundary!
Template parameters:
- NC: number of coefficients, > 0
--- Legal stuff ---
This program is free software. It comes without any warranty, to
the extent permitted by applicable law. You can redistribute it
and/or modify it under the terms of the Do What The Fuck You Want
To Public License, Version 2, as published by Sam Hocevar. See
http://sam.zoy.org/wtfpl/COPYING for more details.
*Tab=3***********************************************************************/
#pragma once
#if ! defined (hiir_Downsampler2x4F64Avx_HEADER_INCLUDED)
#define hiir_Downsampler2x4F64Avx_HEADER_INCLUDED
#if defined (_MSC_VER)
#pragma warning (4 : 4250)
#endif
/*\\\ INCLUDE FILES \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
#include "hiir/def.h"
#include "hiir/StageDataF64Avx.h"
#include <immintrin.h>
#include <array>
namespace hiir
{
template <int NC>
class Downsampler2x4F64Avx
{
static_assert ((NC > 0), "Number of coefficient must be positive.");
/*\\\ PUBLIC \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
public:
typedef double DataType;
static const int _nbr_chn = 4;
enum { NBR_COEFS = NC };
Downsampler2x4F64Avx ();
Downsampler2x4F64Avx (const Downsampler2x4F64Avx <NC> &other) = default;
Downsampler2x4F64Avx (Downsampler2x4F64Avx <NC> &&other) = default;
~Downsampler2x4F64Avx () = default;
Downsampler2x4F64Avx <NC> &
operator = (const Downsampler2x4F64Avx <NC> &other) = default;
Downsampler2x4F64Avx <NC> &
operator = (Downsampler2x4F64Avx <NC> &&other) = default;
void set_coefs (const double coef_arr []);
hiir_FORCEINLINE __m256d
process_sample (const double in_ptr [_nbr_chn * 2]);
hiir_FORCEINLINE __m256d
process_sample (__m256d in_0, __m256d in_1);
void process_block (double out_ptr [], const double in_ptr [], long nbr_spl);
hiir_FORCEINLINE void
process_sample_split (__m256d &low, __m256d &high, const double in_ptr [_nbr_chn * 2]);
hiir_FORCEINLINE void
process_sample_split (__m256d &low, __m256d &high, __m256d in_0, __m256d in_1);
void process_block_split (double out_l_ptr [], double out_h_ptr [], const double in_ptr [], long nbr_spl);
void clear_buffers ();
/*\\\ PROTECTED \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
protected:
/*\\\ PRIVATE \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
typedef std::array <StageDataF64Avx, NBR_COEFS + 2> Filter; // Stages 0 and 1 contain only input memories
Filter _filter; // Should be the first member (thus easier to align)
/*\\\ FORBIDDEN MEMBER FUNCTIONS \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
bool operator == (const Downsampler2x4F64Avx <NC> &other) const = delete;
bool operator != (const Downsampler2x4F64Avx <NC> &other) const = delete;
}; // class Downsampler2x4F64Avx
} // namespace hiir
#include "hiir/Downsampler2x4F64Avx.hpp"
#endif // hiir_Downsampler2x4F64Avx_HEADER_INCLUDED
/*\\\ EOF \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/