-
Notifications
You must be signed in to change notification settings - Fork 3
/
transpose-threads.h
81 lines (75 loc) · 4.07 KB
/
transpose-threads.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
/**
* Transpose functions.
*
* @author Kaushik Datta <[email protected]>
* @date 2019-08-06
*/
#ifndef TRANSPOSE_THREADS_H
#define TRANSPOSE_THREADS_H
#include <complex.h>
#include <stdlib.h>
/**
 * "thrrow" transpose entry point for float elements.
 *
 * Declared here only; the definition lives in another translation unit.
 * Returns nothing, so no status is reported through the return value.
 *
 * NOTE(review): judging by the name, "thrrow" presumably means the work is
 * divided among threads by row, and B presumably receives the
 * A_cols x A_rows transpose of A -- confirm against the implementation.
 * The storage order of A and B (row- vs. column-major) is not stated in
 * this header.
 *
 * @param A        Input elements; const-qualified, so never written through
 *                 this pointer.
 * @param B        Non-const buffer, presumably the output (TODO confirm).
 *                 A and B are both restrict-qualified, so the two buffers
 *                 are expected not to overlap.
 * @param A_rows   Presumably the number of rows of A (TODO confirm).
 * @param A_cols   Presumably the number of columns of A (TODO confirm).
 * @param num_thr  Presumably the number of threads to use (TODO confirm);
 *                 whether 0 is accepted is not visible from here.
 */
void transpose_flt_thrrow(const float* restrict A, float* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/** Same parameter list as transpose_flt_thrrow(), with double elements. */
void transpose_dbl_thrrow(const double* restrict A, double* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/** Same parameter list as transpose_flt_thrrow(), with float complex elements. */
void transpose_fcmplx_thrrow(const float complex* restrict A,
float complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/** Same parameter list as transpose_flt_thrrow(), with double complex elements. */
void transpose_dcmplx_thrrow(const double complex* restrict A,
double complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/**
 * "thrcol" transpose entry point for float elements.
 *
 * Declared here only; the definition lives in another translation unit.
 * Returns nothing, so no status is reported through the return value.
 *
 * NOTE(review): judging by the name, "thrcol" presumably means the work is
 * divided among threads by column, and B presumably receives the
 * A_cols x A_rows transpose of A -- confirm against the implementation.
 * The storage order of A and B (row- vs. column-major) is not stated in
 * this header.
 *
 * @param A        Input elements; const-qualified, so never written through
 *                 this pointer.
 * @param B        Non-const buffer, presumably the output (TODO confirm).
 *                 A and B are both restrict-qualified, so the two buffers
 *                 are expected not to overlap.
 * @param A_rows   Presumably the number of rows of A (TODO confirm).
 * @param A_cols   Presumably the number of columns of A (TODO confirm).
 * @param num_thr  Presumably the number of threads to use (TODO confirm);
 *                 whether 0 is accepted is not visible from here.
 */
void transpose_flt_thrcol(const float* restrict A, float* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/** Same parameter list as transpose_flt_thrcol(), with double elements. */
void transpose_dbl_thrcol(const double* restrict A, double* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/** Same parameter list as transpose_flt_thrcol(), with float complex elements. */
void transpose_fcmplx_thrcol(const float complex* restrict A,
float complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/** Same parameter list as transpose_flt_thrcol(), with double complex elements. */
void transpose_dcmplx_thrcol(const double complex* restrict A,
double complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr);
/**
 * "thrrow_blocked" transpose entry point for float elements.
 *
 * Declared here only; the definition lives in another translation unit.
 * Returns nothing, so no status is reported through the return value.
 *
 * NOTE(review): judging by the name, this is presumably a row-threaded
 * transpose that processes A in blk_rows x blk_cols tiles, with B
 * presumably receiving the A_cols x A_rows transpose of A -- confirm
 * against the implementation. The storage order of A and B (row- vs.
 * column-major) is not stated in this header.
 *
 * @param A         Input elements; const-qualified, so never written
 *                  through this pointer.
 * @param B         Non-const buffer, presumably the output (TODO confirm).
 *                  A and B are both restrict-qualified, so the two buffers
 *                  are expected not to overlap.
 * @param A_rows    Presumably the number of rows of A (TODO confirm).
 * @param A_cols    Presumably the number of columns of A (TODO confirm).
 * @param num_thr   Presumably the number of threads to use (TODO confirm);
 *                  whether 0 is accepted is not visible from here.
 * @param blk_rows  Presumably the block height in rows (TODO confirm).
 * @param blk_cols  Presumably the block width in columns (TODO confirm).
 *                  Whether the block sizes must be non-zero or must divide
 *                  A_rows / A_cols evenly is not visible from here.
 */
void transpose_flt_thrrow_blocked(const float* restrict A, float* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/** Same parameter list as transpose_flt_thrrow_blocked(), with double elements. */
void transpose_dbl_thrrow_blocked(const double* restrict A, double* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/** Same parameter list as transpose_flt_thrrow_blocked(), with float complex elements. */
void transpose_fcmplx_thrrow_blocked(const float complex* restrict A,
float complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/** Same parameter list as transpose_flt_thrrow_blocked(), with double complex elements. */
void transpose_dcmplx_thrrow_blocked(const double complex* restrict A,
double complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/**
 * "thrcol_blocked" transpose entry point for float elements.
 *
 * Declared here only; the definition lives in another translation unit.
 * Returns nothing, so no status is reported through the return value.
 *
 * NOTE(review): judging by the name, this is presumably a column-threaded
 * transpose that processes A in blk_rows x blk_cols tiles, with B
 * presumably receiving the A_cols x A_rows transpose of A -- confirm
 * against the implementation. The storage order of A and B (row- vs.
 * column-major) is not stated in this header.
 *
 * @param A         Input elements; const-qualified, so never written
 *                  through this pointer.
 * @param B         Non-const buffer, presumably the output (TODO confirm).
 *                  A and B are both restrict-qualified, so the two buffers
 *                  are expected not to overlap.
 * @param A_rows    Presumably the number of rows of A (TODO confirm).
 * @param A_cols    Presumably the number of columns of A (TODO confirm).
 * @param num_thr   Presumably the number of threads to use (TODO confirm);
 *                  whether 0 is accepted is not visible from here.
 * @param blk_rows  Presumably the block height in rows (TODO confirm).
 * @param blk_cols  Presumably the block width in columns (TODO confirm).
 *                  Whether the block sizes must be non-zero or must divide
 *                  A_rows / A_cols evenly is not visible from here.
 */
void transpose_flt_thrcol_blocked(const float* restrict A, float* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/** Same parameter list as transpose_flt_thrcol_blocked(), with double elements. */
void transpose_dbl_thrcol_blocked(const double* restrict A, double* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/** Same parameter list as transpose_flt_thrcol_blocked(), with float complex elements. */
void transpose_fcmplx_thrcol_blocked(const float complex* restrict A,
float complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
/** Same parameter list as transpose_flt_thrcol_blocked(), with double complex elements. */
void transpose_dcmplx_thrcol_blocked(const double complex* restrict A,
double complex* restrict B,
size_t A_rows, size_t A_cols,
size_t num_thr,
size_t blk_rows, size_t blk_cols);
#endif /* TRANSPOSE_THREADS_H */