FFTLIB User Guide
FFTLIB_UTIL_SE0AloadComputeC.h
Go to the documentation of this file.
1 /******************************************************************************/
5 /* Copyright (C) 2015 Texas Instruments Incorporated - https://www.ti.com/
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  *
11  * Redistributions of source code must retain the above copyright
12  * notice, this list of conditions and the following disclaimer.
13  *
14  * Redistributions in binary form must reproduce the above copyright
15  * notice, this list of conditions and the following disclaimer in the
16  * documentation and/or other materials provided with the
17  * distribution.
18  *
19  * Neither the name of Texas Instruments Incorporated nor the names of
20  * its contributors may be used to endorse or promote products derived
21  * from this software without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
24  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
25  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
26  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
27  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
28  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
29  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
30  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
31  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
32  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
33  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  ******************************************************************************/
36 
37 #ifndef COMMON_FFTLIB_UTIL_SE0ALOADCOMPUTEC_H_
38 #define COMMON_FFTLIB_UTIL_SE0ALOADCOMPUTEC_H_ 1
39 
40 /*******************************************************************************
41  *
42  * INCLUDES
43  *
44  ******************************************************************************/
45 
46 
47 
48 
49 /******************************************************************************/
50 /******************************************************************************/
59 /******************************************************************************/
60 #ifdef __cplusplus
61 #pragma FUNC_ALWAYS_INLINE
62 #else
63 #pragma FUNC_ALWAYS_INLINE(FFTLIB_UTIL_SE0AloadComputeC)
64 #endif
65 static inline void FFTLIB_UTIL_SE0AloadComputeC(int32_t numRows)
66 {
67  int32_t r;
68 
69  for(r = 0; r < numRows; r++){
70  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
71  __HWALDA(valA);
72  __HWAOP(__MMA_A_LDA);
73  __HWAADV();
74  }
75 
76  return;
77 }
78 
79 #ifdef __cplusplus
80 #pragma FUNC_ALWAYS_INLINE
81 #else
82 #pragma FUNC_ALWAYS_INLINE(FFTLIB_UTIL_SE0AloadComputeC_unroll16)
83 #endif
84 static inline void FFTLIB_UTIL_SE0AloadComputeC_unroll16(int32_t numRows)
85 {
86  int32_t r;
87  FFTLIB_UNROLL(16)
88  for(r = 0; r < numRows; r++){
89  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
90  __HWALDA(valA);
91  __HWAOP(__MMA_A_LDA);
92  __HWAADV();
93  }
94 
95  return;
96 }
97 
98 #ifdef __cplusplus
99 #pragma FUNC_ALWAYS_INLINE
100 #else
101 #pragma FUNC_ALWAYS_INLINE(FFTLIB_UTIL_SE0AloadComputeC_unroll32)
102 #endif
103 static inline void FFTLIB_UTIL_SE0AloadComputeC_unroll32(int32_t numRows)
104 {
105  int32_t r;
106 
107  FFTLIB_UNROLL(32)
108  for(r = 0; r < numRows; r++){
109  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
110  __HWALDA(valA);
111  __HWAOP(__MMA_A_LDA);
112  __HWAADV();
113  }
114 
115  return;
116 }
117 
118 #ifdef __cplusplus
119 #pragma FUNC_ALWAYS_INLINE
120 #else
121 #pragma FUNC_ALWAYS_INLINE(FFTLIB_UTIL_SE0AloadComputeC_unroll64)
122 #endif
123 static inline void FFTLIB_UTIL_SE0AloadComputeC_unroll64(int32_t numRows)
124 {
125  int32_t r;
126 
127  FFTLIB_UNROLL(64)
128  for(r = 0; r < numRows; r++){
129  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
130  __HWALDA(valA);
131  __HWAOP(__MMA_A_LDA);
132  __HWAADV();
133  }
134 
135  return;
136 }
137 
138 #ifdef __cplusplus
139 #pragma FUNC_ALWAYS_INLINE
140 #else
141 #pragma FUNC_ALWAYS_INLINE(FFTLIB_UTIL_SE0AloadComputeC_unroll)
142 #endif
143 #ifdef __cplusplus
144 template <int32_t UNROLL_TIMES>
145 static inline void FFTLIB_UTIL_SE0AloadComputeC_unroll(int32_t numRows)
146 {
147  int32_t r;
148 
149  FFTLIB_UNROLL(UNROLL_TIMES)
150  for(r = 0; r < numRows; r++){
151  __mma_vec valA = c7x::strm_eng<0, __mma_vec>::get_adv();
152  __HWALDA(valA);
153  __HWAOP(__MMA_A_LDA);
154  __HWAADV();
155  }
156 
157  return;
158 }
159 #endif
160 #endif /* COMMON_FFTLIB_UTIL_SE0ALOADCOMPUTEC_H_ */
static void FFTLIB_UTIL_SE0AloadComputeC(int32_t numRows)
use streaming engine 0 to load numRows of A compute C(row) = A(row) x Bfore(:,:)
static void FFTLIB_UTIL_SE0AloadComputeC_unroll16(int32_t numRows)
static void FFTLIB_UTIL_SE0AloadComputeC_unroll32(int32_t numRows)
static void FFTLIB_UTIL_SE0AloadComputeC_unroll64(int32_t numRows)