FFTLIB User Guide
FFTLIB_UTIL_SE0AloadSE1BloadComputeC.h
Go to the documentation of this file.
1 /******************************************************************************/
5 /* Copyright (C) 2015 Texas Instruments Incorporated - https://www.ti.com/
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  *
11  * Redistributions of source code must retain the above copyright
12  * notice, this list of conditions and the following disclaimer.
13  *
14  * Redistributions in binary form must reproduce the above copyright
15  * notice, this list of conditions and the following disclaimer in the
16  * documentation and/or other materials provided with the
17  * distribution.
18  *
19  * Neither the name of Texas Instruments Incorporated nor the names of
20  * its contributors may be used to endorse or promote products derived
21  * from this software without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
24  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
25  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
26  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
27  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
28  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
29  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
30  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
31  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
32  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
33  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  ******************************************************************************/
36 
37 #ifndef COMMON_FFTLIB_UTIL_SE0ALOADSE1BLOADCOMPUTEC_H_
38 #define COMMON_FFTLIB_UTIL_SE0ALOADSE1BLOADCOMPUTEC_H_ 1
39 
40 /*******************************************************************************
41  *
42  * INCLUDES
43  *
44  ******************************************************************************/
45 
46 
47 
48 
49 /******************************************************************************/
50 
51 /******************************************************************************/
59 /******************************************************************************/
61 static inline void FFTLIB_UTIL_SE0AloadSE1BloadComputeC(int32_t numRows)
62 {
63  int32_t r;
64  _nassert(numRows > 0);
65  for(r = 0; r < numRows; r++){
66  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
67  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
68  __HWALDAB(valA, valB);
69  __HWAOP(__MMA_A_LDA);
70  __HWAADV();
71  }
72  return;
73 }
74 
76 static inline void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll16(int32_t numRows)
77 {
78  int32_t r;
79 
80  FFTLIB_UNROLL(16)
81  for(r = 0; r < numRows; r++){
82  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
83  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
84  __HWALDAB(valA, valB);
85  __HWAOP(__MMA_A_LDA);
86  __HWAADV();
87  }
88  return;
89 }
90 
92 static inline void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll32(int32_t numRows)
93 {
94  int32_t r;
95 
96  FFTLIB_UNROLL(32)
97  for(r = 0; r < numRows; r++){
98  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
99  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
100  __HWALDAB(valA, valB);
101  __HWAOP(__MMA_A_LDA);
102  __HWAADV();
103  }
104  return;
105 }
106 
108 static inline void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll64(int32_t numRows)
109 {
110  int32_t r;
111 
112  FFTLIB_UNROLL(64)
113  for(r = 0; r < numRows; r++){
114  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
115  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
116  __HWALDAB(valA, valB);
117  __HWAOP(__MMA_A_LDA);
118  __HWAADV();
119  }
120  return;
121 }
122 
123 #ifdef __cplusplus
124 __INLINE_FUNC(FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll)
125 template <int32_t UNROLL_TIMES>
126 static inline void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll(int32_t numRows)
127 {
128  int32_t r;
129 
130  FFTLIB_UNROLL(UNROLL_TIMES)
131  for(r = 0; r < numRows; r++){
132  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
133  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
134  __HWALDAB(valA, valB);
135  __HWAOP(__MMA_A_LDA);
136  __HWAADV();
137  }
138  return;
139 }
140 #endif
141 
142 #ifdef __cplusplus
143 __INLINE_FUNC(FFTLIB_UTIL_SE0AloadSE1BloadComputeC_peel)
144 template <int32_t UNROLL_TIMES>
145 static inline void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_peel(int32_t numRows, int32_t peelSize)
146 {
147  int32_t r;
148 
149  FFTLIB_UNROLL(UNROLL_TIMES)
150  for(r = 0; r < peelSize; r++){
151  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
152  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
153  __HWALDAB(valA, valB);
154  __HWAOP(__MMA_A_LDA);
155  __HWAADV();
156  }
157 
158  _nassert(numRows > 0);
159  for(r = peelSize; r < numRows; r++){
160  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
161  __mma_vec valB = c7x::strm_eng<1, __mma_vec>::get_adv();
162  __HWALDAB(valA, valB);
163  __HWAOP(__MMA_A_LDA);
164  __HWAADV();
165  }
166  return;
167 }
168 #endif
169 #endif /* COMMON_FFTLIB_UTIL_SE0ALOADSE1BLOADCOMPUTEC_H_ */
static void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll16(int32_t numRows)
static void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll32(int32_t numRows)
static void FFTLIB_UTIL_SE0AloadSE1BloadComputeC_unroll64(int32_t numRows)
static void FFTLIB_UTIL_SE0AloadSE1BloadComputeC(int32_t numRows)
#define __INLINE_FUNC(x)
Definition: FFTLIB_types.h:67