Wavelets/dwt_cpu.h at master · oshkosher/Wavelets · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
#ifndef __DWT_CPU_H__
#define __DWT_CPU_H__

#include "wavelet.h"
#include "cucheck.h"

// Filter tap constants for the CDF 9/7 wavelet, written as single-precision
// literals and grouped by stage (analysis / synthesis) and band
// (lowpass / highpass).
// NOTE(review): the numeric suffix is presumably the tap's distance from the
// filter center (only one side of each filter is listed) -- confirm against
// the code that uses these macros.
#define CDF97_ANALYSIS_LOWPASS_FILTER_0  .85269867900940f
#define CDF97_ANALYSIS_LOWPASS_FILTER_1  .377402855612650f
#define CDF97_ANALYSIS_LOWPASS_FILTER_2 -.110624404418420f
#define CDF97_ANALYSIS_LOWPASS_FILTER_3 -.02384946501938f
#define CDF97_ANALYSIS_LOWPASS_FILTER_4  .037828455506995f

#define CDF97_ANALYSIS_HIGHPASS_FILTER_0 -.788485616405660f
#define CDF97_ANALYSIS_HIGHPASS_FILTER_1  .418092273222210f
#define CDF97_ANALYSIS_HIGHPASS_FILTER_2  .040689417609558f
#define CDF97_ANALYSIS_HIGHPASS_FILTER_3 -.064538882628938f

// NOTE(review): the synthesis sets below share several magnitudes with the
// analysis sets above (e.g. tap 1 of both lowpass sets is identical) --
// presumably intentional for how the inverse transform indexes its input;
// confirm against the implementation before "correcting" any value.
#define CDF97_SYNTHESIS_LOWPASS_FILTER_0  .788485616405660f
#define CDF97_SYNTHESIS_LOWPASS_FILTER_1  .377402855612650f
#define CDF97_SYNTHESIS_LOWPASS_FILTER_2 -.040689417609558f
#define CDF97_SYNTHESIS_LOWPASS_FILTER_3 -.02384946501938f

#define CDF97_SYNTHESIS_HIGHPASS_FILTER_0 -.85269867900940f
#define CDF97_SYNTHESIS_HIGHPASS_FILTER_1  .418092273222210f
#define CDF97_SYNTHESIS_HIGHPASS_FILTER_2  .110624404418420f
#define CDF97_SYNTHESIS_HIGHPASS_FILTER_3 -.064538882628938f
#define CDF97_SYNTHESIS_HIGHPASS_FILTER_4 -.037828455506995f

/*
  Simple implementation of a discrete wavelet transform using the CPU.
*/

// Bit-level helpers; only declared here, the definitions live elsewhere.
// NOTE(review): presumably countLeadingZeros returns the number of leading
// zero bits in x and ceilLog2 returns ceil(log2(x)) -- confirm against the
// definitions, in particular the result for x == 0.
unsigned countLeadingZeros(unsigned x);
unsigned ceilLog2(unsigned x);

// Returns the maximum number of steps a DWT can take for a given input
// length. This is essentially ceil(log2(length)).
int dwtMaximumSteps(int length);

// Padding checks for one dimension (length, steps) and for three dimensions
// at once (size, steps given as int3).
// NOTE(review): presumably true when the length is already compatible with
// the requested number of transform steps -- confirm the exact rule against
// the definition.
bool is_padded_for_wavelet(int length, int steps);
bool is_padded_for_wavelet(scu_wavelet::int3 size, scu_wavelet::int3 steps);

// Transpose a square matrix of 'size' rows and 'size' columns.
// Only one buffer is passed and nothing is returned, so the result is
// presumably written back into 'data' -- confirm against the definition.
void transpose_square(int size, float data[]);
void transpose_square(int size, double data[]);

/*
  Transpose an upper-left square of a square matrix.

  total_size is the side length of the whole matrix, submatrix_size the
  side length of the upper-left square that gets transposed.

  transpose_square_submatrix(4, 2, data):
    a b . .       a c . .
    c d . .   ->  b d . .
    . . . .       . . . .
    . . . .       . . . .

    All "." cells would be unchanged.
*/
void transpose_square_submatrix(int total_size, int submatrix_size,
                                float data[]);

// Transpose a width x height rectangular matrix from 'src' into 'dest'.
// NOTE(review): the template is only declared here; the definition (and any
// explicit instantiations) must be provided elsewhere -- confirm which
// element types are supported.
template<class NUM>
void transpose_rect(NUM *dest, const NUM *src, int width, int height);

// Single-buffer overload of transpose_rect.
// NOTE(review): presumably transposes 'matrix' in place -- confirm against
// the definition.
template<class NUM>
void transpose_rect(NUM *matrix, int width, int height);


// print a matrix (for debugging purposes)
// NOTE(review): 'data' presumably holds width*height values -- confirm the
// expected layout against the definition.
void print_matrix(int width, int height, float *data);

// Haar wavelet filter on one row of data, and the inverse.
// length is the number of elements in data.
// Set inverse to true to run the inverse transform.
// stepCount is the number of passes over the data. Values <= 0 will
// result in ceil(log2(length)) passes.
void haar(int length, float data[], bool inverse = false,
          int stepCount = -1);
void haar(int length, double data[], bool inverse = false,
          int stepCount = -1);

// Haar wavelet transform on a 2-d rectangle of data.
// stepCountX and stepCountY give the number of passes in each direction.
// Returns true on success, false if the data is not properly padded.
// (The return type is bool; no timing value is returned.)
bool haar_2d(float *data, int width, int height, bool inverse = false,
             int stepCountX = -1, int stepCountY = -1);

bool haar_2d(double *data, int width, int height, bool inverse = false,
             int stepCountX = -1, int stepCountY = -1);

// CDF 9/7 wavelet transform on a 2-d rectangle of data, with the same
// parameter list as haar_2d.
// NOTE(review): presumably the same return convention as haar_2d (true on
// success, false when not properly padded) -- confirm against the definition.
bool cdf97_2d(float *data, int width, int height, bool inverse = false,
              int stepCountX = -1, int stepCountY = -1);

bool cdf97_2d(double *data, int width, int height, bool inverse = false,
              int stepCountX = -1, int stepCountY = -1);

// 3-d Haar
// NOTE(review): stepCount presumably carries one step count per axis --
// confirm against the definition.
void haar_3d(CubeFloat *data, scu_wavelet::int3 stepCount,
             bool inverse = false);

// Selects how pad elements are filled; passed as the 'pad' argument of
// dwt_pad and dwt_pad_2d.
typedef enum {
  ZERO_FILL,  // fill pad elements with zero
  REFLECT,    // fill with reflection: abcde -> abcdedcb
  REPEAT      // fill with copies of last value: abcde->abcdeeee
} DWTPadding;


/*
  Given an input length, return that length rounded up to a length
  compatible with 'stepCount' steps of discrete wavelet transforms.
  If powerOfTwo is true, round up to a power of two. Otherwise,
  round up to a multiple of 2^stepCount. Return the rounded up length.

  Going by this description, length=10 with stepCount=2 would give 12
  when powerOfTwo is false and 16 when powerOfTwo is true.
*/
int dwt_padded_length(int length, int stepCount, bool powerOfTwo);


/*
  Pad an array to the given length with the given padding method.

  inputLen is the number of valid elements in input, outputLen the
  padded length, and pad selects how the extra elements are filled
  (see DWTPadding).

  The output array is returned. If output is NULL, a new array will be
  allocated. If inputLen==0, then the output array will be zero-filled.

  NOTE(review): how a newly allocated array must be released is not
  visible from this header -- confirm against the definition.
*/
float *dwt_pad(int inputLen, float input[],
	       int outputLen, float *output,
	       DWTPadding pad);
double *dwt_pad(int inputLen, double input[],
		int outputLen, double *output,
		DWTPadding pad);

// 2-d counterparts of dwt_pad: pad a rows x cols input to
// outputRows x outputCols.
// NOTE(review): rowPitch and outputPitch are presumably the distance, in
// elements, between the starts of consecutive rows, and a NULL output
// presumably triggers allocation as in dwt_pad -- confirm both against the
// definition.
float *dwt_pad_2d(int rows, int cols, int rowPitch, float *input,
		  int outputRows, int outputCols, int outputPitch,
		  float *output, DWTPadding pad);
double *dwt_pad_2d(int rows, int cols, int rowPitch, double *input,
		   int outputRows, int outputCols, int outputPitch,
		   double *output, DWTPadding pad);

// 1-d CDF 9.7 wavelet transform and its inverse, applied to 'length'
// elements of 'data' for 'stepCount' steps.
// NOTE(review): tempGiven is presumably an optional caller-supplied scratch
// buffer, with the implementation providing its own when it is NULL --
// confirm the required size against the definition.
void cdf97(int length, float *data, int stepCount, float *tempGiven = NULL);
void cdf97_inverse(int length, float *data, int stepCount, float *tempGiven = NULL);

// 3-d CDF 9.7
// Set inverse to true to run the inverse transform.
// NOTE(review): stepCount presumably carries one step count per axis and
// quiet presumably suppresses diagnostic output -- confirm against the
// definition.
void cdf97_3d(CubeFloat *data, scu_wavelet::int3 stepCount,
              bool inverse = false, bool quiet = false);


/*
  Wrap an array such that if you reference values beyond the ends
  of the array, the results will be mirrored array values.

  For example, given an array with 7 elements: 0 1 2 3 4 5 6
  Request array[0..6] and you'll get the usual values array[0..6].
  array[-1] returns array[1], array[-2] returns array[2], etc.
  array[7] returns array[5], array[8] returns array[4], etc.

  The wrapper only stores the pointer it is given; it never frees or
  copies the data, and access is read-only.
*/
template<class T>
class MirroredArray {
  int length;  // length of the actual data
  const T *array;

public:
  // Wrap 'array_', which holds 'length_' elements.
  HD MirroredArray(int length_, const T *array_)
    : length(length_), array(array_) {}

  /*
    Map an arbitrary offset onto the valid index range [0, length-1] by
    reflecting at both ends (the end elements themselves are not repeated).

    If length <= 1 there is nothing to reflect around, so 0 is returned.
    Without that check the folding loop below would never terminate for
    length == 1 with a nonzero offset (it maps k to -k and back to k).
  */
  HD static int getOffset(int offset, int length) {

    // degenerate arrays: the only candidate index is 0
    if (length <= 1) return 0;

    // negative offset: mirror to a positive
    if (offset < 0) offset = -offset;

    // past the end: fold it back, repeat if necessary
    // try using modulo, see if it speeds this up
    while (offset >= length) {
      offset = length*2 - offset - 2;

      // folded past the left end: mirror at 0 again
      if (offset < 0) offset = -offset;
    }

    return offset;
  }


  // Return the element at the mirrored position of 'offset'.
  // The wrapped array must hold at least one element; for an empty array
  // getOffset() yields 0 and array[0] would be read.
  HD T operator[] (int offset) const {
    return array[getOffset(offset, length)];
  }

  // Change the number of elements considered valid.
  HD void setLength(int len) {length = len;}
};


/* An iterator that walks through a mirrored array.
   For example, if the array is of length 3, and you start walking forward
   from 0:
   0, 1, 2, 1, 0, 1, 2, ...

   The class has no constructor, so its members hold no defined value
   until init() has been called; call init() before get() or operator++.
*/
class MirroredIterator {
  int length, pos, direction;

 public:
  // Start iterating over an array of 'length_' elements at logical position
  // 'pos_', which may lie outside [0, length_-1]. The stored position is the
  // mirrored index, and the direction is set so that subsequent increments
  // continue the forward walk from 'pos_'.
  HD void init(int length_, int pos_) {
    length = length_;
    pos = pos_;

    // handle pathological cases gracefully
    if (length <= 1) {
      length = 1;
      pos = 0;
      direction = 0;
      return;
    }

    direction = 1;

    // if the position is off to the left, invert it at 0 and the direction
    if (pos < 0) {
      pos = -pos;
      direction = -direction;
    }

    while (pos >= length) {
      // if it's off to the right, invert it at (length-1) and the direction
      pos = length*2 - pos - 2;
      if (pos < 0) {
        // but if that throws it off the left, invert again at 0 but
        // leave direction unchanged
        pos = -pos;
      } else {
        direction = -direction;
      }
    }
  }

  // Current (mirrored) index.
  HD int get() {return pos;}

  // postfix increment: returns the index before stepping
  HD int operator++(int) {
    int prev = pos;
    pos += direction;

    // wrap negative values around to large positive values by
    // casting to unsigned, so one comparison catches both ends
    if ((unsigned)pos >= (unsigned)length) {
      // bounce: reverse, then step back inside past the end element
      direction = -direction;
      pos += (direction * 2);
    }

    return prev;
  }

  /*
    Map an arbitrary offset onto the valid index range [0, length-1] by
    reflecting at both ends.

    As in init(), length <= 1 is treated as a one-element array and yields
    0. Without that check the folding loop below would never terminate for
    length == 1 with a nonzero offset (it maps k to -k and back to k).
  */
  HD static int getOffset(int offset, int length) {

    // handle pathological cases gracefully, matching init()
    if (length <= 1) return 0;

    // negative offset: mirror to a positive
    if (offset < 0) offset = -offset;

    // past the end: fold it back, repeat if necessary
    // try using modulo, see if it speeds this up
    while (offset >= length) {
      offset = length*2 - offset - 2;

      // folded past the left end: mirror at 0 again
      if (offset < 0) offset = -offset;
    }

    return offset;
  }

};


// A simpler relative of MirroredArray: indexing inside the valid range
// returns the stored element, and any index outside it returns 0.
template<class T>
class ZeroExtendedArray {
  T *elements;  // wrapped data; only the pointer is stored
  int count;    // number of valid elements

public:
  // Wrap 'array_', which holds 'length_' elements.
  HD ZeroExtendedArray(T *array_, int length_)
    : elements(array_), count(length_) {}

  // Element at 'offset' when 0 <= offset < length, otherwise 0.
  HD T operator[] (int offset) const {
    const bool inRange = (offset >= 0) && (offset < count);
    if (inRange) {
      return elements[offset];
    }

    return 0;
  }

  // Change the number of elements considered valid.
  HD void setLength(int len) {
    count = len;
  }
};


#endif // __DWT_CPU_H__