DSPLIB User Guide
DSPLIB_sqr_ci.cpp
Go to the documentation of this file.
1 /******************************************************************************/
5 /* Copyright (C) 2017 Texas Instruments Incorporated - https://www.ti.com/
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions
9  * are met:
10  *
11  * Redistributions of source code must retain the above copyright
12  * notice, this list of conditions and the following disclaimer.
13  *
14  * Redistributions in binary form must reproduce the above copyright
15  * notice, this list of conditions and the following disclaimer in the
16  * documentation and/or other materials provided with the
17  * distribution.
18  *
19  * Neither the name of Texas Instruments Incorporated nor the names of
20  * its contributors may be used to endorse or promote products derived
21  * from this software without specific prior written permission.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
24  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
25  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
26  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
27  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
28  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
29  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
30  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
31  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
32  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
33  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34  *
35  ******************************************************************************/
36 
37 /******************************************************************************
38  * Version 1.0 Date 10/2/22 Author: Asheesh Bhardwaj
39  *****************************************************************************/
40 
41 /*******************************************************************************
42  *
43  * INCLUDES
44  *
45  ******************************************************************************/
46 
47 #include "../common/c71/DSPLIB_inlines.h"
48 #include "DSPLIB_sqr_priv.h"
49 #include <float.h>
50 
51 /*******************************************************************************
52  *
53  * DEFINES
54  *
55  ******************************************************************************/
56 #define SE_PARAM_BASE (0x0000)
57 #define SE_SE0_PARAM_OFFSET (SE_PARAM_BASE)
58 #define SE_SA0_PARAM_OFFSET (SE_SE0_PARAM_OFFSET + SE_PARAM_SIZE)
59 
60 template <typename dataType>
62  const DSPLIB_bufParams1D_t *bufParamsIn,
63  const DSPLIB_bufParams1D_t *bufParamsOut,
64  const DSPLIB_sqr_InitArgs *pKerInitArgs)
65 {
67  DSPLIB_sqr_PrivArgs *pKerPrivArgs = (DSPLIB_sqr_PrivArgs *) handle;
68  uint32_t blockSize = pKerPrivArgs->blockSize;
69 
70  __SE_TEMPLATE_v1 se0Params;
71  __SA_TEMPLATE_v1 sa0Params;
72 
73  __SE_ELETYPE SE_ELETYPE;
74  __SE_VECLEN SE_VECLEN;
75  __SA_VECLEN SA_VECLEN;
76 
77  uint8_t *pBlock = pKerPrivArgs->bufPblock;
78 
79  typedef typename c7x::make_full_vector<dataType>::type vec;
80  SE_VECLEN = c7x::se_veclen<vec>::value;
81  SA_VECLEN = c7x::sa_veclen<vec>::value;
82  SE_ELETYPE = c7x::se_eletype<vec>::value;
83 
84 #if DSPLIB_DEBUGPRINT
85  int32_t eleCount = c7x::element_count_of<vec>::value;
86  printf("Enter eleCount %d\n", eleCount);
87 #endif
88 
89  /**********************************************************************/
90  /* Prepare streaming engine 1 to fetch the input */
91  /**********************************************************************/
92  se0Params = __gen_SE_TEMPLATE_v1();
93 
94  se0Params.ICNT0 = blockSize;
95  se0Params.ELETYPE = SE_ELETYPE;
96  se0Params.VECLEN = SE_VECLEN;
97  se0Params.DIMFMT = __SE_DIMFMT_1D;
98 
99  /**********************************************************************/
100  /* Prepare SA template to store output */
101  /**********************************************************************/
102  sa0Params = __gen_SA_TEMPLATE_v1();
103 
104  sa0Params.ICNT0 = blockSize;
105  sa0Params.DIM1 = blockSize;
106  sa0Params.VECLEN = SA_VECLEN;
107  sa0Params.DIMFMT = __SA_DIMFMT_1D;
108 
109  *(__SE_TEMPLATE_v1 *) ((uint8_t *) pBlock + SE_SE0_PARAM_OFFSET) = se0Params;
110  *(__SA_TEMPLATE_v1 *) ((uint8_t *) pBlock + SE_SA0_PARAM_OFFSET) = sa0Params;
111 
112  return status;
113 }
114 
116  const DSPLIB_bufParams1D_t *bufParamsIn,
117  const DSPLIB_bufParams1D_t *bufParamsOut,
118  const DSPLIB_sqr_InitArgs *pKerInitArgs);
119 
121  const DSPLIB_bufParams1D_t *bufParamsIn,
122  const DSPLIB_bufParams1D_t *bufParamsOut,
123  const DSPLIB_sqr_InitArgs *pKerInitArgs);
124 
126  const DSPLIB_bufParams1D_t *bufParamsIn,
127  const DSPLIB_bufParams1D_t *bufParamsOut,
128  const DSPLIB_sqr_InitArgs *pKerInitArgs);
129 
131  const DSPLIB_bufParams1D_t *bufParamsIn,
132  const DSPLIB_bufParams1D_t *bufParamsOut,
133  const DSPLIB_sqr_InitArgs *pKerInitArgs);
134 
136  const DSPLIB_bufParams1D_t *bufParamsIn,
137  const DSPLIB_bufParams1D_t *bufParamsOut,
138  const DSPLIB_sqr_InitArgs *pKerInitArgs);
139 
141  const DSPLIB_bufParams1D_t *bufParamsIn,
142  const DSPLIB_bufParams1D_t *bufParamsOut,
143  const DSPLIB_sqr_InitArgs *pKerInitArgs);
144 
146  const DSPLIB_bufParams1D_t *bufParamsIn,
147  const DSPLIB_bufParams1D_t *bufParamsOut,
148  const DSPLIB_sqr_InitArgs *pKerInitArgs);
149 
151  const DSPLIB_bufParams1D_t *bufParamsIn,
152  const DSPLIB_bufParams1D_t *bufParamsOut,
153  const DSPLIB_sqr_InitArgs *pKerInitArgs);
154 
155 template <typename dataType, int32_t dataIn>
156 DSPLIB_STATUS DSPLIB_sqr_exec_ci(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
157 {
158  DSPLIB_sqr_PrivArgs *pKerPrivArgs = (DSPLIB_sqr_PrivArgs *) handle;
159  uint32_t blockSize = pKerPrivArgs->blockSize;
160 
161  __SE_TEMPLATE_v1 se0Params;
162  __SA_TEMPLATE_v1 sa0Params;
163 
164  dataType *restrict pInLocal = (dataType *) pIn;
165  dataType *restrict pOutLocal = (dataType *) pOut;
166 
167 #if DSPLIB_DEBUGPRINT
168  printf("Enter DSPLIB_sqr_exec_ci\n");
169 #endif
170 
171  typedef typename c7x::make_full_vector<dataType>::type vec;
172  int32_t eleCount = c7x::element_count_of<vec>::value;
173 
174 #if DSPLIB_DEBUGPRINT
175  printf("Enter eleCount %d\n", eleCount);
176 #endif
177 
178  uint8_t *pBlock = pKerPrivArgs->bufPblock;
179 
180  se0Params = *(__SE_TEMPLATE_v1 *) ((uint8_t *) pBlock + SE_SE0_PARAM_OFFSET);
181  sa0Params = *(__SA_TEMPLATE_v1 *) ((uint8_t *) pBlock + SE_SA0_PARAM_OFFSET);
182  // Input samples
183  __SE0_OPEN(pInLocal, se0Params);
184 
185  // Output samples
186  __SA0_OPEN(sa0Params);
187 
188 #if DSPLIB_DEBUGPRINT
189  printf("DSPLIB_DEBUGPRINT blockSize %d\n", blockSize);
190 #endif
191 
192  vec out;
193  for (int32_t counter = 0; counter < blockSize; counter += eleCount) {
194  vec a = c7x::strm_eng<0, vec>::get_adv();
195 
196  out = a * a;
197 
198  __vpred tmp = c7x::strm_agen<0, vec>::get_vpred();
199  vec *VB1 = c7x::strm_agen<0, vec>::get_adv(pOutLocal);
200 
201  __vstore_pred(tmp, VB1, out);
202  }
203  __SE0_CLOSE();
204  __SE1_CLOSE();
205  __SA0_CLOSE();
206 
207  return DSPLIB_SUCCESS;
208 }
209 
211 DSPLIB_sqr_exec_ci<float, DSPLIB_FLOAT32>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
212 
214 DSPLIB_sqr_exec_ci<double, DSPLIB_FLOAT64>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
215 
217 DSPLIB_sqr_exec_ci<int8_t, DSPLIB_INT8>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
218 
220 DSPLIB_sqr_exec_ci<uint8_t, DSPLIB_UINT8>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
221 
223 DSPLIB_sqr_exec_ci<int16_t, DSPLIB_INT16>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
224 
226 DSPLIB_sqr_exec_ci<uint16_t, DSPLIB_UINT16>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
227 
229 DSPLIB_sqr_exec_ci<int32_t, DSPLIB_INT32>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
230 
232 DSPLIB_sqr_exec_ci<uint32_t, DSPLIB_UINT32>(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut);
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< int32_t, DSPLIB_INT32 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_init_ci< uint8_t >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
DSPLIB_STATUS DSPLIB_sqr_init_ci(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
This function is the initialization function for the C7x implementation of the kernel....
template DSPLIB_STATUS DSPLIB_sqr_init_ci< double >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
#define SE_SE0_PARAM_OFFSET
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< int16_t, DSPLIB_INT16 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< float, DSPLIB_FLOAT32 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< uint16_t, DSPLIB_UINT16 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_init_ci< int8_t >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
template DSPLIB_STATUS DSPLIB_sqr_init_ci< uint16_t >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< uint8_t, DSPLIB_UINT8 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< int8_t, DSPLIB_INT8 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_init_ci< int32_t >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
template DSPLIB_STATUS DSPLIB_sqr_init_ci< uint32_t >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
DSPLIB_STATUS DSPLIB_sqr_exec_ci(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
This function is the main execution function for the C7x implementation of the kernel....
template DSPLIB_STATUS DSPLIB_sqr_init_ci< float >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< double, DSPLIB_FLOAT64 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
template DSPLIB_STATUS DSPLIB_sqr_init_ci< int16_t >(DSPLIB_kernelHandle handle, const DSPLIB_bufParams1D_t *bufParamsIn, const DSPLIB_bufParams1D_t *bufParamsOut, const DSPLIB_sqr_InitArgs *pKerInitArgs)
template DSPLIB_STATUS DSPLIB_sqr_exec_ci< uint32_t, DSPLIB_UINT32 >(DSPLIB_kernelHandle handle, void *restrict pIn, void *restrict pOut)
#define SE_SA0_PARAM_OFFSET
Header file for kernel's internal use. For the kernel's interface, please see DSPLIB_sqr.
DSPLIB_STATUS_NAME
The enumeration of all status codes.
Definition: DSPLIB_types.h:151
void * DSPLIB_kernelHandle
Handle type for DSPLIB operations.
Definition: DSPLIB_types.h:172
@ DSPLIB_SUCCESS
Definition: DSPLIB_types.h:152
A structure for a 1 dimensional buffer descriptor.
Structure containing the parameters to initialize the kernel.
Definition: DSPLIB_sqr.h:105
Structure that is reserved for internal use by the kernel.
int32_t blockSize
Size of input buffer for different batches DSPLIB_sqr_init that will be retrieved and used by DSPLIB_...
uint8_t bufPblock[DSPLIB_SQR_IXX_IXX_OXX_PBLOCK_SIZE]