-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathDownsampler2x16Avx512.h
135 lines (73 loc) · 3.49 KB
/
Downsampler2x16Avx512.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
/*****************************************************************************
Downsampler2x16Avx512.h
Author: Laurent de Soras, 2020
Downsamples the input signal by a factor of 2, operating on vectors of 16
floats with the AVX-512 instruction set.
This object must be aligned on a 64-byte boundary!
Template parameters:
- NC: number of coefficients, > 0
--- Legal stuff ---
This program is free software. It comes without any warranty, to
the extent permitted by applicable law. You can redistribute it
and/or modify it under the terms of the Do What The Fuck You Want
To Public License, Version 2, as published by Sam Hocevar. See
http://sam.zoy.org/wtfpl/COPYING for more details.
*Tab=3***********************************************************************/
#pragma once
#if ! defined (hiir_Downsampler2x16Avx512_HEADER_INCLUDED)
#define hiir_Downsampler2x16Avx512_HEADER_INCLUDED
#if defined (_MSC_VER)
#pragma warning (4 : 4250)
#endif
/*\\\ INCLUDE FILES \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
#include "hiir/def.h"
#include "hiir/StageDataAvx512.h"
#include <immintrin.h>
#include <xmmintrin.h>
#include <array>
namespace hiir
{
template <int NC>
class Downsampler2x16Avx512
{
static_assert ((NC > 0), "Number of coefficient must be positive.");
/*\\\ PUBLIC \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
public:
typedef float DataType;
static const int _nbr_chn = 16;
enum { NBR_COEFS = NC };
Downsampler2x16Avx512 ();
Downsampler2x16Avx512 (const Downsampler2x16Avx512 <NC> &other) = default;
Downsampler2x16Avx512 (Downsampler2x16Avx512 <NC> &&other) = default;
~Downsampler2x16Avx512 () = default;
Downsampler2x16Avx512 <NC> &
operator = (const Downsampler2x16Avx512 <NC> &other) = default;
Downsampler2x16Avx512 <NC> &
operator = (Downsampler2x16Avx512 <NC> &&other) = default;
void set_coefs (const double coef_arr []);
hiir_FORCEINLINE __m512
process_sample (const float in_ptr [_nbr_chn * 2]);
hiir_FORCEINLINE __m512
process_sample (__m512 in_0, __m512 in_1);
void process_block (float out_ptr [], const float in_ptr [], long nbr_spl);
hiir_FORCEINLINE void
process_sample_split (__m512 &low, __m512 &high, const float in_ptr [_nbr_chn * 2]);
hiir_FORCEINLINE void
process_sample_split (__m512 &low, __m512 &high, __m512 in_0, __m512 in_1);
void process_block_split (float out_l_ptr [], float out_h_ptr [], const float in_ptr [], long nbr_spl);
void clear_buffers ();
/*\\\ PROTECTED \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
protected:
/*\\\ PRIVATE \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
// Stages 0 and 1 contain only input memories
typedef std::array <StageDataAvx512, NBR_COEFS + 2> Filter;
Filter _filter; // Should be the first member (thus easier to align)
/*\\\ FORBIDDEN MEMBER FUNCTIONS \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
bool operator == (const Downsampler2x16Avx512 <NC> &other) const = delete;
bool operator != (const Downsampler2x16Avx512 <NC> &other) const = delete;
}; // class Downsampler2x16Avx512
} // namespace hiir
#include "hiir/Downsampler2x16Avx512.hpp"
#endif // hiir_Downsampler2x16Avx512_HEADER_INCLUDED
/*\\\ EOF \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/