Line | Branch | Exec | Source |
---|---|---|---|
1 | |||
2 | /* autogenerated from volk_8i_s32f_convert_32f_a_orc_impl.orc */ | ||
3 | |||
4 | #ifdef HAVE_CONFIG_H | ||
5 | #include "config.h" | ||
6 | #endif | ||
7 | #include <math.h> | ||
8 | |||
9 | #ifndef _ORC_INTEGER_TYPEDEFS_ | ||
10 | #define _ORC_INTEGER_TYPEDEFS_ | ||
11 | #if defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L | ||
12 | #include <stdint.h> | ||
13 | typedef int8_t orc_int8; | ||
14 | typedef int16_t orc_int16; | ||
15 | typedef int32_t orc_int32; | ||
16 | typedef int64_t orc_int64; | ||
17 | typedef uint8_t orc_uint8; | ||
18 | typedef uint16_t orc_uint16; | ||
19 | typedef uint32_t orc_uint32; | ||
20 | typedef uint64_t orc_uint64; | ||
21 | #define ORC_UINT64_C(x) UINT64_C(x) | ||
22 | #elif defined(_MSC_VER) | ||
23 | typedef signed __int8 orc_int8; | ||
24 | typedef signed __int16 orc_int16; | ||
25 | typedef signed __int32 orc_int32; | ||
26 | typedef signed __int64 orc_int64; | ||
27 | typedef unsigned __int8 orc_uint8; | ||
28 | typedef unsigned __int16 orc_uint16; | ||
29 | typedef unsigned __int32 orc_uint32; | ||
30 | typedef unsigned __int64 orc_uint64; | ||
31 | #define ORC_UINT64_C(x) (x##Ui64) | ||
32 | #define inline __inline | ||
33 | #else | ||
34 | #include <limits.h> | ||
35 | typedef signed char orc_int8; | ||
36 | typedef short orc_int16; | ||
37 | typedef int orc_int32; | ||
38 | typedef unsigned char orc_uint8; | ||
39 | typedef unsigned short orc_uint16; | ||
40 | typedef unsigned int orc_uint32; | ||
41 | #if INT_MAX == LONG_MAX | ||
42 | typedef long long orc_int64; | ||
43 | typedef unsigned long long orc_uint64; | ||
44 | #define ORC_UINT64_C(x) (x##ULL) | ||
45 | #else | ||
46 | typedef long orc_int64; | ||
47 | typedef unsigned long orc_uint64; | ||
48 | #define ORC_UINT64_C(x) (x##UL) | ||
49 | #endif | ||
50 | #endif | ||
51 | typedef union { orc_int16 i; orc_int8 x2[2]; } orc_union16; | ||
52 | typedef union { orc_int32 i; float f; orc_int16 x2[2]; orc_int8 x4[4]; } orc_union32; | ||
53 | typedef union { orc_int64 i; double f; orc_int32 x2[2]; float x2f[2]; orc_int16 x4[4]; } orc_union64; | ||
54 | #endif | ||
55 | #ifndef ORC_RESTRICT | ||
56 | #if defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L | ||
57 | #define ORC_RESTRICT restrict | ||
58 | #elif defined(__GNUC__) && __GNUC__ >= 4 | ||
59 | #define ORC_RESTRICT __restrict__ | ||
60 | #elif defined(_MSC_VER) | ||
61 | #define ORC_RESTRICT __restrict | ||
62 | #else | ||
63 | #define ORC_RESTRICT | ||
64 | #endif | ||
65 | #endif | ||
66 | |||
67 | #ifndef ORC_INTERNAL | ||
68 | #if defined(__SUNPRO_C) && (__SUNPRO_C >= 0x590) | ||
69 | #define ORC_INTERNAL __attribute__((visibility("hidden"))) | ||
70 | #elif defined(__SUNPRO_C) && (__SUNPRO_C >= 0x550) | ||
71 | #define ORC_INTERNAL __hidden | ||
72 | #elif defined (__GNUC__) | ||
73 | #define ORC_INTERNAL __attribute__((visibility("hidden"))) | ||
74 | #else | ||
75 | #define ORC_INTERNAL | ||
76 | #endif | ||
77 | #endif | ||
78 | |||
79 | |||
80 | #ifndef DISABLE_ORC | ||
81 | #include <orc/orc.h> | ||
82 | #endif | ||
83 | void volk_8i_s32f_convert_32f_a_orc_impl (orc_uint32 * ORC_RESTRICT d1, const orc_uint8 * ORC_RESTRICT s1, float p1, int n); | ||
84 | |||
85 | |||
86 | /* begin Orc C target preamble */ | ||
87 | #define ORC_CLAMP(x,a,b) ((x)<(a) ? (a) : ((x)>(b) ? (b) : (x))) | ||
88 | #define ORC_ABS(a) ((a)<0 ? -(a) : (a)) | ||
89 | #define ORC_MIN(a,b) ((a)<(b) ? (a) : (b)) | ||
90 | #define ORC_MAX(a,b) ((a)>(b) ? (a) : (b)) | ||
91 | #define ORC_SB_MAX 127 | ||
92 | #define ORC_SB_MIN (-1-ORC_SB_MAX) | ||
93 | #define ORC_UB_MAX (orc_uint8) 255 | ||
94 | #define ORC_UB_MIN 0 | ||
95 | #define ORC_SW_MAX 32767 | ||
96 | #define ORC_SW_MIN (-1-ORC_SW_MAX) | ||
97 | #define ORC_UW_MAX (orc_uint16)65535 | ||
98 | #define ORC_UW_MIN 0 | ||
99 | #define ORC_SL_MAX 2147483647 | ||
100 | #define ORC_SL_MIN (-1-ORC_SL_MAX) | ||
101 | #define ORC_UL_MAX 4294967295U | ||
102 | #define ORC_UL_MIN 0 | ||
103 | #define ORC_CLAMP_SB(x) ORC_CLAMP(x,ORC_SB_MIN,ORC_SB_MAX) | ||
104 | #define ORC_CLAMP_UB(x) ORC_CLAMP(x,ORC_UB_MIN,ORC_UB_MAX) | ||
105 | #define ORC_CLAMP_SW(x) ORC_CLAMP(x,ORC_SW_MIN,ORC_SW_MAX) | ||
106 | #define ORC_CLAMP_UW(x) ORC_CLAMP(x,ORC_UW_MIN,ORC_UW_MAX) | ||
107 | #define ORC_CLAMP_SL(x) ORC_CLAMP(x,ORC_SL_MIN,ORC_SL_MAX) | ||
108 | #define ORC_CLAMP_UL(x) ORC_CLAMP(x,ORC_UL_MIN,ORC_UL_MAX) | ||
109 | #define ORC_SWAP_W(x) ((((x)&0xffU)<<8) | (((x)&0xff00U)>>8)) | ||
110 | #define ORC_SWAP_L(x) ((((x)&0xffU)<<24) | (((x)&0xff00U)<<8) | (((x)&0xff0000U)>>8) | (((x)&0xff000000U)>>24)) | ||
111 | #define ORC_SWAP_Q(x) ((((x)&ORC_UINT64_C(0xff))<<56) | (((x)&ORC_UINT64_C(0xff00))<<40) | (((x)&ORC_UINT64_C(0xff0000))<<24) | (((x)&ORC_UINT64_C(0xff000000))<<8) | (((x)&ORC_UINT64_C(0xff00000000))>>8) | (((x)&ORC_UINT64_C(0xff0000000000))>>24) | (((x)&ORC_UINT64_C(0xff000000000000))>>40) | (((x)&ORC_UINT64_C(0xff00000000000000))>>56)) | ||
112 | #define ORC_PTR_OFFSET(ptr,offset) ((void *)(((unsigned char *)(ptr)) + (offset))) | ||
113 | #define ORC_DENORMAL(x) ((x) & ((((x)&0x7f800000) == 0) ? 0xff800000 : 0xffffffff)) | ||
114 | #define ORC_ISNAN(x) ((((x)&0x7f800000) == 0x7f800000) && (((x)&0x007fffff) != 0)) | ||
115 | #define ORC_DENORMAL_DOUBLE(x) ((x) & ((((x)&ORC_UINT64_C(0x7ff0000000000000)) == 0) ? ORC_UINT64_C(0xfff0000000000000) : ORC_UINT64_C(0xffffffffffffffff))) | ||
116 | #define ORC_ISNAN_DOUBLE(x) ((((x)&ORC_UINT64_C(0x7ff0000000000000)) == ORC_UINT64_C(0x7ff0000000000000)) && (((x)&ORC_UINT64_C(0x000fffffffffffff)) != 0)) | ||
117 | #ifndef ORC_RESTRICT | ||
118 | #if defined(__STDC_VERSION__) && __STDC_VERSION__ >= 199901L | ||
119 | #define ORC_RESTRICT restrict | ||
120 | #elif defined(__GNUC__) && __GNUC__ >= 4 | ||
121 | #define ORC_RESTRICT __restrict__ | ||
122 | #else | ||
123 | #define ORC_RESTRICT | ||
124 | #endif | ||
125 | #endif | ||
126 | /* end Orc C target preamble */ | ||
127 | |||
128 | |||
129 | |||
130 | /* volk_8i_s32f_convert_32f_a_orc_impl */ | ||
131 | #ifdef DISABLE_ORC | ||
132 | void | ||
133 | volk_8i_s32f_convert_32f_a_orc_impl (orc_uint32 * ORC_RESTRICT d1, const orc_uint8 * ORC_RESTRICT s1, float p1, int n){ | ||
134 | int i; | ||
135 | orc_union32 * ORC_RESTRICT ptr0; | ||
136 | const orc_int8 * ORC_RESTRICT ptr4; | ||
137 | orc_int8 var35; | ||
138 | orc_union32 var36; | ||
139 | orc_union32 var37; | ||
140 | orc_union16 var38; | ||
141 | orc_union32 var39; | ||
142 | orc_union32 var40; | ||
143 | |||
144 | ptr0 = (orc_union32 *)d1; | ||
145 | ptr4 = (orc_int8 *)s1; | ||
146 | |||
147 | /* 4: loadpl */ | ||
148 | var36.f = p1; | ||
149 | |||
150 | for (i = 0; i < n; i++) { | ||
151 | /* 0: loadb */ | ||
152 | var35 = ptr4[i]; | ||
153 | /* 1: convsbw */ | ||
154 | var38.i = var35; | ||
155 | /* 2: convswl */ | ||
156 | var39.i = var38.i; | ||
157 | /* 3: convlf */ | ||
158 | var40.f = var39.i; | ||
159 | /* 5: mulf */ | ||
160 | { | ||
161 | orc_union32 _src1; | ||
162 | orc_union32 _src2; | ||
163 | orc_union32 _dest1; | ||
164 | _src1.i = ORC_DENORMAL(var40.i); | ||
165 | _src2.i = ORC_DENORMAL(var36.i); | ||
166 | _dest1.f = _src1.f * _src2.f; | ||
167 | var37.i = ORC_DENORMAL(_dest1.i); | ||
168 | } | ||
169 | /* 6: storel */ | ||
170 | ptr0[i] = var37; | ||
171 | } | ||
172 | |||
173 | } | ||
174 | |||
175 | #else | ||
176 | static void | ||
177 | ✗ | _backup_volk_8i_s32f_convert_32f_a_orc_impl (OrcExecutor * ORC_RESTRICT ex) | |
178 | { | ||
179 | int i; | ||
180 | ✗ | int n = ex->n; | |
181 | orc_union32 * ORC_RESTRICT ptr0; | ||
182 | const orc_int8 * ORC_RESTRICT ptr4; | ||
183 | orc_int8 var35; | ||
184 | orc_union32 var36; | ||
185 | orc_union32 var37; | ||
186 | orc_union16 var38; | ||
187 | orc_union32 var39; | ||
188 | orc_union32 var40; | ||
189 | |||
190 | ✗ | ptr0 = (orc_union32 *)ex->arrays[0]; | |
191 | ✗ | ptr4 = (orc_int8 *)ex->arrays[4]; | |
192 | |||
193 | /* 4: loadpl */ | ||
194 | ✗ | var36.i = ex->params[24]; | |
195 | |||
196 | ✗ | for (i = 0; i < n; i++) { | |
197 | /* 0: loadb */ | ||
198 | ✗ | var35 = ptr4[i]; | |
199 | /* 1: convsbw */ | ||
200 | ✗ | var38.i = var35; | |
201 | /* 2: convswl */ | ||
202 | ✗ | var39.i = var38.i; | |
203 | /* 3: convlf */ | ||
204 | ✗ | var40.f = var39.i; | |
205 | /* 5: mulf */ | ||
206 | { | ||
207 | orc_union32 _src1; | ||
208 | orc_union32 _src2; | ||
209 | orc_union32 _dest1; | ||
210 | ✗ | _src1.i = ORC_DENORMAL(var40.i); | |
211 | ✗ | _src2.i = ORC_DENORMAL(var36.i); | |
212 | ✗ | _dest1.f = _src1.f * _src2.f; | |
213 | ✗ | var37.i = ORC_DENORMAL(_dest1.i); | |
214 | } | ||
215 | /* 6: storel */ | ||
216 | ✗ | ptr0[i] = var37; | |
217 | } | ||
218 | |||
219 | ✗ | } | |
220 | |||
221 | void | ||
222 | 2 | volk_8i_s32f_convert_32f_a_orc_impl (orc_uint32 * ORC_RESTRICT d1, const orc_uint8 * ORC_RESTRICT s1, float p1, int n) | |
223 | { | ||
224 | 2 | OrcExecutor _ex, *ex = &_ex; | |
225 | static volatile int p_inited = 0; | ||
226 | static OrcCode *c = 0; | ||
227 | void (*func) (OrcExecutor *); | ||
228 | |||
229 |
1/2✓ Branch 0 taken 2 times.
✗ Branch 1 not taken.
|
2 | if (!p_inited) { |
230 | 2 | orc_once_mutex_lock (); | |
231 |
1/2✓ Branch 0 taken 2 times.
✗ Branch 1 not taken.
|
2 | if (!p_inited) { |
232 | OrcProgram *p; | ||
233 | |||
234 | #if 1 | ||
235 | static const orc_uint8 bc[] = { | ||
236 | 1, 9, 35, 118, 111, 108, 107, 95, 56, 105, 95, 115, 51, 50, 102, 95, | ||
237 | 99, 111, 110, 118, 101, 114, 116, 95, 51, 50, 102, 95, 97, 95, 111, 114, | ||
238 | 99, 95, 105, 109, 112, 108, 11, 4, 4, 12, 1, 1, 17, 4, 20, 4, | ||
239 | 20, 4, 20, 2, 149, 34, 4, 153, 33, 34, 211, 32, 33, 202, 0, 32, | ||
240 | 24, 2, 0, | ||
241 | }; | ||
242 | 2 | p = orc_program_new_from_static_bytecode (bc); | |
243 | 2 | orc_program_set_backup_function (p, _backup_volk_8i_s32f_convert_32f_a_orc_impl); | |
244 | #else | ||
245 | p = orc_program_new (); | ||
246 | orc_program_set_name (p, "volk_8i_s32f_convert_32f_a_orc_impl"); | ||
247 | orc_program_set_backup_function (p, _backup_volk_8i_s32f_convert_32f_a_orc_impl); | ||
248 | orc_program_add_destination (p, 4, "d1"); | ||
249 | orc_program_add_source (p, 1, "s1"); | ||
250 | orc_program_add_parameter_float (p, 4, "p1"); | ||
251 | orc_program_add_temporary (p, 4, "t1"); | ||
252 | orc_program_add_temporary (p, 4, "t2"); | ||
253 | orc_program_add_temporary (p, 2, "t3"); | ||
254 | |||
255 | orc_program_append_2 (p, "convsbw", 0, ORC_VAR_T3, ORC_VAR_S1, ORC_VAR_D1, ORC_VAR_D1); | ||
256 | orc_program_append_2 (p, "convswl", 0, ORC_VAR_T2, ORC_VAR_T3, ORC_VAR_D1, ORC_VAR_D1); | ||
257 | orc_program_append_2 (p, "convlf", 0, ORC_VAR_T1, ORC_VAR_T2, ORC_VAR_D1, ORC_VAR_D1); | ||
258 | orc_program_append_2 (p, "mulf", 0, ORC_VAR_D1, ORC_VAR_T1, ORC_VAR_P1, ORC_VAR_D1); | ||
259 | #endif | ||
260 | |||
261 | 2 | orc_program_compile (p); | |
262 | 2 | c = orc_program_take_code (p); | |
263 | 2 | orc_program_free (p); | |
264 | } | ||
265 | 2 | p_inited = TRUE; | |
266 | 2 | orc_once_mutex_unlock (); | |
267 | } | ||
268 | 2 | ex->arrays[ORC_VAR_A2] = c; | |
269 | 2 | ex->program = 0; | |
270 | |||
271 | 2 | ex->n = n; | |
272 | 2 | ex->arrays[ORC_VAR_D1] = d1; | |
273 | 2 | ex->arrays[ORC_VAR_S1] = (void *)s1; | |
274 | { | ||
275 | orc_union32 tmp; | ||
276 | 2 | tmp.f = p1; | |
277 | 2 | ex->params[ORC_VAR_P1] = tmp.i; | |
278 | } | ||
279 | |||
280 | 2 | func = c->exec; | |
281 | 2 | func (ex); | |
282 | 2 | } | |
283 | #endif | ||
284 | |||
285 | |||
286 |