-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathDownsampler2x4Neon.h
134 lines (72 loc) · 3.46 KB
/
Downsampler2x4Neon.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
/*****************************************************************************
Downsampler2x4Neon.h
Author: Laurent de Soras, 2016
Downsamples the input signal by a factor of 2, processing vectors of 4 floats
with the NEON instruction set.
This object must be aligned on a 16-byte boundary!
Template parameters:
- NC: number of coefficients, > 0
--- Legal stuff ---
This program is free software. It comes without any warranty, to
the extent permitted by applicable law. You can redistribute it
and/or modify it under the terms of the Do What The Fuck You Want
To Public License, Version 2, as published by Sam Hocevar. See
http://sam.zoy.org/wtfpl/COPYING for more details.
*Tab=3***********************************************************************/
#pragma once
#if ! defined (hiir_Downsampler2x4Neon_HEADER_INCLUDED)
#define hiir_Downsampler2x4Neon_HEADER_INCLUDED
#if defined (_MSC_VER)
#pragma warning (4 : 4250)
#endif
/*\\\ INCLUDE FILES \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
#include "hiir/def.h"
#include "hiir/StageDataNeonV4.h"
#include <arm_neon.h>
#include <array>
namespace hiir
{
template <int NC>
class Downsampler2x4Neon
{
static_assert ((NC > 0), "Number of coefficient must be positive.");
/*\\\ PUBLIC \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
public:
typedef float DataType;
static const int _nbr_chn = 4;
enum { NBR_COEFS = NC };
Downsampler2x4Neon ();
Downsampler2x4Neon (const Downsampler2x4Neon <NC> &other) = default;
Downsampler2x4Neon (Downsampler2x4Neon <NC> &&other) = default;
~Downsampler2x4Neon () = default;
Downsampler2x4Neon <NC> &
operator = (const Downsampler2x4Neon <NC> &other) = default;
Downsampler2x4Neon <NC> &
operator = (Downsampler2x4Neon <NC> &&other) = default;
void set_coefs (const double coef_arr []);
hiir_FORCEINLINE float32x4_t
process_sample (const float in_ptr [8]);
hiir_FORCEINLINE float32x4_t
process_sample (float32x4_t in_0, float32x4_t in_1);
void process_block (float out_ptr [], const float in_ptr [], long nbr_spl);
hiir_FORCEINLINE void
process_sample_split (float32x4_t &low, float32x4_t &high, const float in_ptr [8]);
hiir_FORCEINLINE void
process_sample_split (float32x4_t &low, float32x4_t &high, float32x4_t in_0, float32x4_t in_1);
void process_block_split (float out_l_ptr [], float out_h_ptr [], const float in_ptr [], long nbr_spl);
void clear_buffers ();
/*\\\ PROTECTED \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
protected:
/*\\\ PRIVATE \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
typedef std::array <StageDataNeonV4, NBR_COEFS + 2> Filter; // Stages 0 and 1 contain only input memories
Filter _filter; // Should be the first member (thus easier to align)
/*\\\ FORBIDDEN MEMBER FUNCTIONS \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/
private:
bool operator == (const Downsampler2x4Neon <NC> &other) const = delete;
bool operator != (const Downsampler2x4Neon <NC> &other) const = delete;
}; // class Downsampler2x4Neon
} // namespace hiir
#include "hiir/Downsampler2x4Neon.hpp"
#endif // hiir_Downsampler2x4Neon_HEADER_INCLUDED
/*\\\ EOF \\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\\*/